refactor(snowflake_query): optimize Arrow data processing with explicit row collection (#92)

This commit is contained in:
dal 2025-02-04 15:57:35 -08:00 committed by GitHub
parent d0ff21e10d
commit 0fde90b848
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
1 changed file with 315 additions and 313 deletions

View File

@@ -56,12 +56,13 @@ pub async fn snowflake_query(
let rows = match snowflake_client.exec(&limited_query).await {
Ok(result) => match result {
snowflake_api::QueryResult::Arrow(result) => {
result
.iter()
.flat_map(|batch| {
let mut all_rows = Vec::new();
// Process each batch in order
for batch in result.iter() {
let schema = batch.schema();
(0..batch.num_rows()).map(move |row_idx| {
schema
for row_idx in 0..batch.num_rows() {
let row = schema
.fields()
.iter()
.enumerate()
@@ -389,10 +390,11 @@ pub async fn snowflake_query(
};
(field.name().clone(), data_type)
})
.collect::<IndexMap<String, DataType>>()
})
})
.collect()
.collect::<IndexMap<String, DataType>>();
all_rows.push(row);
}
}
all_rows
}
_ => Vec::new(),
},