{"users":[{"id":1,"username":"admin","name":"Admin","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/a/3ec8ea/{size}.png","admin":true,"moderator":true,"trust_level":4},{"id":26,"username":"Aryan","name":"Aryan","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/a/d78d45/{size}.png","trust_level":1},{"id":21,"username":"Sanskar","name":null,"avatar_template":"https://avatars.discourse-cdn.com/v4/letter/s/3d9bf3/{size}.png","trust_level":1},{"id":9,"username":"Tarika","name":null,"avatar_template":"https://avatars.discourse-cdn.com/v4/letter/t/8491ac/{size}.png","moderator":true,"trust_level":1}],"primary_groups":[],"flair_groups":[],"topic_list":{"can_create_topic":false,"more_topics_url":"/c/faqs/24?page=1","per_page":30,"top_tags":[{"id":15,"name":"file-formats","slug":"file-formats"},{"id":10,"name":"aws-azure-google-sf","slug":"aws-azure-google-sf"},{"id":11,"name":"coalesce-writing-op","slug":"coalesce-writing-op"},{"id":19,"name":"configurations","slug":"configurations"},{"id":6,"name":"connections","slug":"connections"},{"id":16,"name":"databricks-snowflake","slug":"databricks-snowflake"},{"id":18,"name":"data-preparation","slug":"data-preparation"},{"id":12,"name":"installation","slug":"installation"},{"id":20,"name":"machine-learning","slug":"machine-learning"},{"id":14,"name":"schedule","slug":"schedule"},{"id":17,"name":"separator","slug":"separator"},{"id":4,"name":"user-guide","slug":"user-guide"}],"topics":[{"fancy_title":"About the FAQs category","id":201,"title":"About the FAQs category","slug":"about-the-faqs-category","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-12-22T13:10:12.502Z","last_posted_at":"2025-12-22T13:10:12.507Z","bumped":true,"bumped_at":"2025-12-22T13:10:12.502Z","archetype":"regular","unseen":false,"pinned":true,"unpinned":null,"excerpt":"Find quick answers to the most commonly asked questions about Sparkflows. This section covers installation, configuration, features, and common issues to help you get up and running faster.","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":4,"like_count":0,"has_summary":false,"last_poster_username":"admin","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":1,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why does recursive directory search slow down large pipelines?","id":282,"title":"Why does recursive directory search slow down large pipelines?","slug":"why-does-recursive-directory-search-slow-down-large-pipelines","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-27T06:37:00.906Z","last_posted_at":"2026-01-27T06:37:00.962Z","bumped":true,"bumped_at":"2026-01-27T06:37:00.962Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What users observe\nPipelines slow down when recursive directory search is enabled. \n\nWhy this happens\nRecursive search: \n\n\nTraverses every subdirectory \n\n\nEvaluates every file \n\n\nPerforms filesystem metadata calls \n\n\nOn &hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":2,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why does Read Excel Advanced skip files and sheets in preview mode?","id":281,"title":"Why does Read Excel Advanced skip files and sheets in preview mode?","slug":"why-does-read-excel-advanced-skip-files-and-sheets-in-preview-mode","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-27T06:36:35.759Z","last_posted_at":"2026-01-27T06:36:35.809Z","bumped":true,"bumped_at":"2026-01-27T06:36:35.809Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What users observe\nIn preview: \n\n\nOnly one file is processed \n\n\nOnly one sheet is processed \n\n\n\nWhy this is intentional\nPreview mode runs locally and synchronously. \nTo protect: \n\n\nBrowser responsiveness \n\n\nDeveloper pro&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":2,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why is CellRange significantly faster than FullSheet in Read Excel Advanced?","id":280,"title":"Why is CellRange significantly faster than FullSheet in Read Excel Advanced?","slug":"why-is-cellrange-significantly-faster-than-fullsheet-in-read-excel-advanced","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-27T06:35:47.120Z","last_posted_at":"2026-01-27T06:35:47.170Z","bumped":true,"bumped_at":"2026-01-27T06:35:47.170Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What users observe\nCellRange reads are much faster on large Excel files. \n\nWhy this happens\nWith CellRange: \n\n\nOnly required rows are sliced \n\n\nOnly required columns are extracted \n\n\nHeader resolution is localized \n\n\nWit&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How can I reliably trace bad values back to the exact Excel cell?","id":279,"title":"How can I reliably trace bad values back to the exact Excel cell?","slug":"how-can-i-reliably-trace-bad-values-back-to-the-exact-excel-cell","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-27T06:35:05.231Z","last_posted_at":"2026-01-27T06:35:05.277Z","bumped":true,"bumped_at":"2026-01-27T06:35:05.277Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"The problem\nWithout traceability, bad data becomes impossible to debug. \n\nSparkflows’ approach\nEnable: \n\n\nOutput File Name as Field \n\n\nOutput Sheet Name as Field \n\n\nUse CellRange when applicable \n\n\nTogether, these allow &hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How does Sparkflows guarantee deterministic schema across many Excel files?","id":278,"title":"How does Sparkflows guarantee deterministic schema across many Excel files?","slug":"how-does-sparkflows-guarantee-deterministic-schema-across-many-excel-files","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-27T06:34:40.176Z","last_posted_at":"2026-01-27T06:34:40.218Z","bumped":true,"bumped_at":"2026-01-27T06:34:40.218Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"The core challenge\nExcel files often drift: \n\n\nExtra columns \n\n\nMissing columns \n\n\nSlight type differences \n\n\n\nSparkflows’ strategy\nSparkflows establishes a reference schema from the first successfully read dataset. \nThe&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why does Sparkflows add fileName and sheetName at the very end of Read Excel Advanced?","id":276,"title":"Why does Sparkflows add fileName and sheetName at the very end of Read Excel Advanced?","slug":"why-does-sparkflows-add-filename-and-sheetname-at-the-very-end-of-read-excel-advanced","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-27T06:33:45.858Z","last_posted_at":"2026-01-27T06:33:45.909Z","bumped":true,"bumped_at":"2026-01-27T06:33:45.909Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What users observe\nWhen enabled, fileName and sheetName columns always appear after all data columns, never in the middle. \n\nWhy Sparkflows does this\nSparkflows treats metadata columns as non-data attributes. \nBy design: &hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why are invalid comma formats treated as text instead of numbers in Read Excel Advanced?","id":275,"title":"Why are invalid comma formats treated as text instead of numbers in Read Excel Advanced?","slug":"why-are-invalid-comma-formats-treated-as-text-instead-of-numbers-in-read-excel-advanced","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-27T06:23:34.207Z","last_posted_at":"2026-01-27T06:23:34.261Z","bumped":true,"bumped_at":"2026-01-27T06:23:34.261Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What users observe\nSome comma-formatted numbers are parsed, others are not. \n\nWhat Sparkflows supports\nValid formats: \n\n\n1,234,567 \n\n\n1,23,456 \n\n\n-1,23,456.78 \n\n\n(123,456) \n\n\nInvalid formats: \n\n\n12,34,5 \n\n\n1,2,3,456 \n\n\nM&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How does Read Excel Advanced handle mixed numeric and text values internally?","id":274,"title":"How does Read Excel Advanced handle mixed numeric and text values internally?","slug":"how-does-read-excel-advanced-handle-mixed-numeric-and-text-values-internally","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-27T06:22:56.222Z","last_posted_at":"2026-01-27T06:22:56.274Z","bumped":true,"bumped_at":"2026-01-27T06:22:56.274Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What users observe\nColumns with mixed values behave inconsistently. \n\nSparkflows’ column-level decision model\nSparkflows makes decisions at the column level, not per cell. \n\n\nIf all sampled values are numeric → numeric t&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How does timestamp inference actually work in Read Excel Advanced?","id":272,"title":"How does timestamp inference actually work in Read Excel Advanced?","slug":"how-does-timestamp-inference-actually-work-in-read-excel-advanced","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-27T06:21:55.151Z","last_posted_at":"2026-01-27T06:21:55.196Z","bumped":true,"bumped_at":"2026-01-27T06:21:55.196Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What users observe\nSome columns are inferred as TIMESTAMP instead of STRING. \n\nHow timestamp inference works\nWhen inferDatesAsTimestamp = true: \n\n\nSparkflows samples column values \n\n\nEach value is tested against a set of&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How does Sparkflows decide between INTEGER, LONG, and DOUBLE in Read Advanced Excel?","id":270,"title":"How does Sparkflows decide between INTEGER, LONG, and DOUBLE in Read Advanced Excel?","slug":"how-does-sparkflows-decide-between-integer-long-and-double-in-read-advanced-excel","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-27T06:20:52.278Z","last_posted_at":"2026-01-27T06:20:52.331Z","bumped":true,"bumped_at":"2026-01-27T06:20:52.331Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What users observe\nA numeric column is inferred as: \n\n\nINTEGER in some cases \n\n\nLONG in others \n\n\nDOUBLE when decimals appear \n\n\n\nHow Sparkflows decides\nSparkflows uses BigDecimal-based sampling logic to infer numeric ty&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why does Sparkflows rename or suffix my column names automatically?","id":268,"title":"Why does Sparkflows rename or suffix my column names automatically?","slug":"why-does-sparkflows-rename-or-suffix-my-column-names-automatically","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-22T06:46:13.901Z","last_posted_at":"2026-01-22T06:46:13.946Z","bumped":true,"bumped_at":"2026-01-22T06:46:13.946Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Column names are: \n\n\nRenamed \n\n\nSuffixed (_1, _2) \n\n\nAuto-generated (F1, F2) \n\n\n\nWhy this happens\nSparkflows guarantees: \n\n\nValid column identifiers \n\n\nUnique column names \n\n\nSchema-safe output \n\n\nIt automatically: \n\n\nPa&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why did my header shift when using CellRange with PREVIOUS_ROW in Excel Reading?","id":267,"title":"Why did my header shift when using CellRange with PREVIOUS_ROW in Excel Reading?","slug":"why-did-my-header-shift-when-using-cellrange-with-previous-row-in-excel-reading","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-22T06:45:41.217Z","last_posted_at":"2026-01-22T06:45:41.263Z","bumped":true,"bumped_at":"2026-01-22T06:45:41.263Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Headers appear offset or misaligned when using: \n\n\nCellRange \n\n\nPREVIOUS_ROW header option \n\n\n\nWhy this happens\nWith CellRange: \n\n\nData is sliced first \n\n\nHeader resolution depends on range boundaries \n\n\nWhen using PREVI&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why did formula cells become null even though Excel shows values?","id":266,"title":"Why did formula cells become null even though Excel shows values?","slug":"why-did-formula-cells-become-null-even-though-excel-shows-values","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-22T06:43:28.080Z","last_posted_at":"2026-01-22T06:43:28.128Z","bumped":true,"bumped_at":"2026-01-22T06:43:28.128Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Sparkflows explicitly checks for Excel formula errors: \n\n\n#DIV/0! \n\n\n#N/A \n\n\n#VALUE! \n\n\n#REF! \n\n\n#NUM! \n\n\n#SPILL! \n\n\nAny such value is converted to null. \n\nWhy this is intentional\nExcel visually hides errors behind forma&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why did a column suddenly become TIMESTAMP instead of STRING?","id":265,"title":"Why did a column suddenly become TIMESTAMP instead of STRING?","slug":"why-did-a-column-suddenly-become-timestamp-instead-of-string","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-22T06:43:04.757Z","last_posted_at":"2026-01-22T06:43:04.801Z","bumped":true,"bumped_at":"2026-01-22T06:43:04.801Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"The engine now supports true timestamp inference. \nWhen inferDatesAsTimestamp = true: \n\n\nSampled values are tested against common date/time formats \n\n\nIf all valid samples match date patterns, the column becomes TIMESTAM&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":2,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why are accounting-style numbers like (1,23,456) handled correctly but others are not?","id":264,"title":"Why are accounting-style numbers like (1,23,456) handled correctly but others are not?","slug":"why-are-accounting-style-numbers-like-1-23-456-handled-correctly-but-others-are-not","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-22T06:42:41.848Z","last_posted_at":"2026-01-22T06:42:41.891Z","bumped":true,"bumped_at":"2026-01-22T06:42:41.891Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Sparkflows explicitly supports: \n\n\nWestern grouping: 1,234,567 \n\n\nIndian grouping: 1,23,456 \n\n\nAccounting negatives: (123,456), -(123,456) \n\n\nThese formats are recognized and normalized safely. \n\nWhat is intentionally re&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":2,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why did percentages become decimal numbers after reading Excel?","id":263,"title":"Why did percentages become decimal numbers after reading Excel?","slug":"why-did-percentages-become-decimal-numbers-after-reading-excel","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-22T06:41:54.101Z","last_posted_at":"2026-01-22T06:41:54.145Z","bumped":true,"bumped_at":"2026-01-22T06:41:54.145Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Sparkflows normalizes percentages during ingestion: \n\n\n% is a display format, not a data type \n\n\nPercentages are converted to numeric equivalents \n\n\nExample: \n\n\n9.4% → 0.094 \n\n\n100% → 1.0 \n\n\n\nWhy this is correct\nThis ens&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why did Read Excel Advanced infer INTEGER in one file but DOUBLE in another?","id":262,"title":"Why did Read Excel Advanced infer INTEGER in one file but DOUBLE in another?","slug":"why-did-read-excel-advanced-infer-integer-in-one-file-but-double-in-another","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-22T06:41:11.722Z","last_posted_at":"2026-01-22T06:41:11.766Z","bumped":true,"bumped_at":"2026-01-22T06:41:11.766Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Sparkflows uses sample-based inference: \n\n\nSamples a fixed number of rows \n\n\nEvaluates numeric precision \n\n\nChooses the tightest safe type \n\n\nRules: \n\n\nWhole numbers → INTEGER or LONG \n\n\nDecimal values → DOUBLE \n\n\nOverfl&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":2,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why did some numeric values turn into null even though Excel shows numbers?","id":261,"title":"Why did some numeric values turn into null even though Excel shows numbers?","slug":"why-did-some-numeric-values-turn-into-null-even-though-excel-shows-numbers","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-22T06:40:04.702Z","last_posted_at":"2026-01-22T06:40:04.749Z","bumped":true,"bumped_at":"2026-01-22T06:40:04.749Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Sparkflows never converts invalid numeric values into strings once a column is inferred as numeric. \nWith the updated engine: \n\n\nValid numeric formats are parsed correctly \n\n\nPercentages, accounting formats, and grouped &hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How to update a pre-formatted Excel template without breaking formatting","id":256,"title":"How to update a pre-formatted Excel template without breaking formatting","slug":"how-to-update-a-pre-formatted-excel-template-without-breaking-formatting","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-15T05:20:59.024Z","last_posted_at":"2026-01-15T05:20:59.071Z","bumped":true,"bumped_at":"2026-01-15T05:20:59.071Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Problem\nUsers want to update data inside an Excel template that contains: \n\n\nFonts \n\n\nColors \n\n\nBorders \n\n\nCharts \n\n\nFormulas \n\n\nBut regular Excel writers destroy formatting. \n\nSolution\nUse Preserve Formatting in the Sav&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":3,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Why is my Excel header not being read correctly in Read Excel Advanced?","id":255,"title":"Why is my Excel header not being read correctly in Read Excel Advanced?","slug":"why-is-my-excel-header-not-being-read-correctly-in-read-excel-advanced","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-15T05:19:40.407Z","last_posted_at":"2026-01-15T05:19:40.464Z","bumped":true,"bumped_at":"2026-01-15T05:19:40.464Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Use Header Handling Mode correctly. \nFIRST_ROW\n\n\nUses the first data row as column names. \n\n\nBest when headers are clean and aligned. \n\n\nPREVIOUS_ROW\n\n\nUses the row before data begins. \n\n\nUseful when headers sit just abo&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":4,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"OverwriteFile vs OverwriteSheet vs AppendSheet in Save Excel Advanced","id":254,"title":"OverwriteFile vs OverwriteSheet vs AppendSheet in Save Excel Advanced","slug":"overwritefile-vs-overwritesheet-vs-appendsheet-in-save-excel-advanced","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-15T05:15:29.615Z","last_posted_at":"2026-01-15T05:15:29.670Z","bumped":true,"bumped_at":"2026-01-15T05:15:29.670Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Problem\nUsers often get confused about which Save Mode to use when writing Excel files. Choosing the wrong option can overwrite important sheets or cause duplicate data. \nExplanation\nThe Save Excel Advanced node provides&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":3,"like_count":0,"has_summary":false,"last_poster_username":"Aryan","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":26,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Select vs Dynamic Select (What’s the Difference?)","id":253,"title":"Select vs Dynamic Select (What’s the Difference?)","slug":"select-vs-dynamic-select-what-s-the-difference","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-15T04:35:12.074Z","last_posted_at":"2026-01-15T04:35:12.134Z","bumped":true,"bumped_at":"2026-01-15T04:35:12.134Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Select Node \n\n\nYou manually pick columns \n\n\nColumn order is either: \n\n\nexactly as listed (propagation OFF), or \n\n\nsame as input data (propagation ON) \n\n\n\n\nBest when your schema is known and stable \n\n\n&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":4,"name":"user-guide","slug":"user-guide"}],"tags_descriptions":{},"views":4,"like_count":0,"has_summary":false,"last_poster_username":"Sanskar","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":21,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How Column Order Works in the Select Node","id":252,"title":"How Column Order Works in the Select Node","slug":"how-column-order-works-in-the-select-node","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":"https://canada1.discourse-cdn.com/flex007/uploads/sparkflows/optimized/1X/9cd9b187f0c5017ec966d0abc19290c6fc811079_2_1024x270.png","created_at":"2026-01-14T05:51:19.328Z","last_posted_at":"2026-01-14T05:51:19.373Z","bumped":true,"bumped_at":"2026-01-14T05:51:19.373Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"It depends on Input Column Propagation. \nPropagation OFF \n\n\nOutput columns appear in exactly the same order as you list them in the Select node. \n\n\nOriginal DataFrame order doesn’t matter. \n\n\nPropagation ON \n\n\nOutput col&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":7,"like_count":0,"has_summary":false,"last_poster_username":"Sanskar","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":21,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How can we add the complete project specification documentation for the individual projects?","id":218,"title":"How can we add the complete project specification documentation for the individual projects?","slug":"how-can-we-add-the-complete-project-specification-documentation-for-the-individual-projects","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":"https://canada1.discourse-cdn.com/flex007/uploads/sparkflows/optimized/1X/223c4daeca34c048e6c005af32086df407f8b8bb_2_1024x735.png","created_at":"2025-12-22T14:48:35.400Z","last_posted_at":"2025-12-22T14:48:35.444Z","bumped":true,"bumped_at":"2025-12-22T14:48:35.444Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Sparkflows provide a feature called Wiki. You can use this feature to list the needs, objectives, expected features, deadlines, budget, outcomes, etc as accurately as possible. \nTo add Wiki for the project management, fo&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":6,"like_count":0,"has_summary":false,"last_poster_username":"Tarika","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":9,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"In Sparkflows is it possible to build a ml model in one machine and use it for prediction in another machine?","id":217,"title":"In Sparkflows is it possible to build a ml model in one machine and use it for prediction in another machine?","slug":"in-sparkflows-is-it-possible-to-build-a-ml-model-in-one-machine-and-use-it-for-prediction-in-another-machine","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-12-22T14:36:41.994Z","last_posted_at":"2025-12-22T14:36:42.046Z","bumped":true,"bumped_at":"2025-12-22T14:36:42.046Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Yes. It is possible. \nSparkflows supports Spark ML Model Save node using which one can save a model into a file. \nGenerated file can be copied over to another machine. \nSparkflows supports Spark ML Model Load node using &hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":20,"name":"machine-learning","slug":"machine-learning"}],"tags_descriptions":{},"views":4,"like_count":0,"has_summary":false,"last_poster_username":"Tarika","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":9,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Currently I am performing Data Analysis task using Excel; how easy would it be to migrate to Sparkflows","id":216,"title":"Currently I am performing Data Analysis task using Excel; how easy would it be to migrate to Sparkflows","slug":"currently-i-am-performing-data-analysis-task-using-excel-how-easy-would-it-be-to-migrate-to-sparkflows","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-12-22T14:23:11.163Z","last_posted_at":"2025-12-22T14:23:11.200Z","bumped":true,"bumped_at":"2025-12-22T14:23:11.200Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Sparkflows provides a huge set of processors to perform different kind of data transformation task. With its less code functionality, migrating to Sparkflows would be smooth and seamless. \nSome of the useful processors i&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":2,"like_count":0,"has_summary":false,"last_poster_username":"Tarika","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":9,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How can I enable/disable the various modules?","id":215,"title":"How can I enable/disable the various modules?","slug":"how-can-i-enable-disable-the-various-modules","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":"https://canada1.discourse-cdn.com/flex007/uploads/sparkflows/optimized/1X/cba6b3be79ee042026bfbe58c4caa1e806e53cba_2_1023x475.png","created_at":"2025-12-22T14:17:32.308Z","last_posted_at":"2025-12-22T14:17:32.428Z","bumped":true,"bumped_at":"2025-12-22T14:17:32.428Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"User with Administrative permission can enable/disable the various modules. \nGo to Administration &gt; Configuration &gt; Module:","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":19,"name":"configurations","slug":"configurations"}],"tags_descriptions":{},"views":2,"like_count":0,"has_summary":false,"last_poster_username":"Tarika","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":9,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How Feature Engineering, Data Profiling and Data Cleansing can be performed in Sparkflows?","id":214,"title":"How Feature Engineering, Data Profiling and Data Cleansing can be performed in Sparkflows?","slug":"how-feature-engineering-data-profiling-and-data-cleansing-can-be-performed-in-sparkflows","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-12-22T14:09:47.290Z","last_posted_at":"2025-12-22T14:09:47.345Z","bumped":true,"bumped_at":"2025-12-22T14:09:47.345Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Following nodes in Sparkflows can help to perform Data Profiling: \n\nCorrelation - It displays relation between dependent and independent features. Relation between features is plotted in Heatmap Graph.\nSummary - It calcu&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":18,"name":"data-preparation","slug":"data-preparation"}],"tags_descriptions":{},"views":2,"like_count":0,"has_summary":false,"last_poster_username":"Tarika","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":9,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How does the Sparkflows platform handle multi-user support (i.e. Can user 1 see or edit user 2’s data sources, pipelines, etc)","id":213,"title":"How does the Sparkflows platform handle multi-user support (i.e. Can user 1 see or edit user 2’s data sources, pipelines, etc)","slug":"how-does-the-sparkflows-platform-handle-multi-user-support-i-e-can-user-1-see-or-edit-user-2-s-data-sources-pipelines-etc","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-12-22T14:07:15.637Z","last_posted_at":"2025-12-22T14:07:15.677Z","bumped":true,"bumped_at":"2025-12-22T14:07:15.677Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Sparkflows supports various user types and enables users to easily share datasets and workflows with each other to foster collaboration.","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":2,"like_count":0,"has_summary":false,"last_poster_username":"Tarika","category_id":24,"op_like_count":0,"pinned_globally":false,"featured_link":null,"is_hot":false,"has_accepted_answer":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":9,"primary_group_id":null,"flair_group_id":null}]}]}}