This is an automated email from the ASF dual-hosted git repository.
aglinxinyuan pushed a change to branch xinyuan-loop-feb
in repository https://gitbox.apache.org/repos/asf/texera.git
from aff56110f2 Merge branch 'xinyuan-state-materialization' into
xinyuan-loop-feb
add 43f276e897 refactor(pyamber): collapse DataProcessor per-call
boilerplate (#4685)
add aa82c6a8f6 docs(license): bundle full third-party MIT license texts
(#4942)
add b9c899f32f feat(docker): run service containers as non-root user
(#4941)
add 6b79896f17 chore: upgrade postgresql to 42.7.10 due to CVE (#4420)
add 41a8197022 test(frontend): re-enable 4 user-workflow / dashboard /
list-item specs (#4944)
add b0ee3b72c3 refactor(pyamber): move tests to src/test/python to match
Maven layout (#4945)
add 635f0cf88c test(amber): warm up ReconfigurationIntegrationSpec before
timed assertions (#4947)
add 3c21b7231d chore(deps): bump pillow from 12.1.1 to 12.2.0 in /amber
(#4959)
add 8b5dbf81b6 chore(deps): bump lodash-es from 4.17.21 to 4.18.1 in
/frontend (#4960)
add 34b004d012 fix(amber): surface writer-thread failure as FatalError
instead of silent hang (#4683)
add 933f7fed77 test(frontend): unblock 7 specs from jsdom (#4950)
add 2d6a759a90 refactor(pyamber): flatten over-nested util packages (#4952)
add f36b938892 chore(deps-dev): bump webpack from 5.89.0 to 5.104.1 in
/frontend (#4970)
add 3bb05ab3fa chore(ci): show Codecov carryforward flags in PR comments
(#4973)
add 9fc5b39d96 test(amber): add unit test coverage for NetworkOutputBuffer
(#4958)
add 16d3c6a169 fix(lineChart): prevent NullPointerException when lines is
not configured (#4919)
add b9bbf0db79 fix: admin-adjustable max columns with a clear overflow
message (#4669)
add 6b3af51c9b fix: replace bare Option.get in getPortId with descriptive
IllegalStateException (#4978)
add 8748b14a36 fix: Duplicate JSONToMap in JSONUtils and JSONUtil (#4977)
add ad0def86c6 chore: ignore local .claude/ directory (#4982)
add b4f3a41a2c chore(deps): drop unused content-disposition dependency
(#4980)
add 6832cfa418 chore(deps): drop redundant wheel pin from requirements.txt
(#4860)
add 0609d3d90f chore(deps): refresh LICENSE-binary for transitive version
drift (#4983)
add deb0e2cfc9 refactor(config): drop unused rest-uri key from
storage.conf (#4990)
add 2652315f6c ci: add /request-review and /unrequest-review comment
commands (#4986)
add 75ff07e36a feat(build): bump Scala/Java services to Java 17 LTS (#4938)
add 6f088ab89e fix: don't re-throw in jsdom-svg-polyfill uncaughtException
handler (#4999)
add 7f7bba8601 test: add real test cases for PresetService spec (#4991)
add c1a8d0f07e test(frontend): re-enable two skipped drag-drop tests
(#4971)
add 502287b75d test: add real specs for left-panel SettingsComponent
(#4992)
add c86dc15f3a test: replace placeholder spec with real MenuComponent
tests (#4993)
add 410c700bb5 fix: Removed duplicate Map operator from operator Desc
files (#5005)
add 6f9f0e355d fix(auth): JwtAuthFilter eager-401 with @PermitAll opt-out
(#4903)
add bb78cca44c test: cover Iceberg REST catalog backend in CI (#4276)
add c93c8f7975 test: add test cases for PresetWrapperComponent spec (#5009)
add 23969c789b test: tighten any types in spec mocks to Mocked<T> (#5008)
add bd445b5157 test(frontend): add unit tests for WorkspaceComponent
(#4969)
add 3344022f6f fix: SourceOperator is_source default broken by name
mangling (#5007)
add 0e9c617e23 test(frontend): add Vitest browser mode and re-enable
workflow-editor spec (#5017)
add 2a23ba59d8 chore(pybuilder): aggregate PyBuilder at root and add API
spec for non-macro pieces (#5024)
add b3706cb66c test: add specs for UserConfigService (#5014)
add 14f8be4c08 test(amber): add direct unit tests for WorkflowCompiler
(#5019)
add 62d4489600 fix: Revert "fix(auth): JwtAuthFilter eager-401 with
@PermitAll opt-out" (#5025)
add dcb457e053 test(frontend): expand spec coverage for download /
code-editor / annotation-suggestion (#5004)
add 2b763e442d refactor(amber): rename remaining Akka* identifiers to
Pekko* (#4949)
add 134d7d2785 feat: Add Python Virtual Environment Support: Installing
User Defined Packages (#4902)
add 7879c2a10f docs: move Hugo docs into repo under docs/ (#5000)
add 078ab64d3e feat: Adding a connection pool to reduce the time spent
opening connection to Postgres (#4851)
add b492a622bd ci: enable GitHub merge queue (#5036)
add 1497806fb7 fix: register OneToOnePartition in PartitionInfo
@JsonSubTypes (#5033)
add 5bff1b4e1f fix: align BroadcastPartition routing in LinkConfig with
broadcast semantics (#5032)
add 6b93b121cc chore(deps): bump transformers from 4.57.3 to 5.0.0rc3 in
/amber (#5016)
add ed2f7758f7 fix: preserve ANY type through schema round-trip (#4995)
add df23815633 feat: Add Python Virtual Environment Support: Uninstalling
User Defined Packages (#5035)
add 4862b924d8 feat(amber): reject self-loops and empty/null op-ids in
LogicalLink (with test coverage) (#4956)
add 4f56946c86 test(workflow-core): add unit test coverage for
port-identity serde helpers (#4954)
add 777db47a3b ci: drop bypass_actors from .asf.yaml ruleset (#5047)
add a671e69db7 ci: fix merge queue ruleset payload (#5050)
add bb795a0c8f fix(amber): avoid AtomicInteger.get_and_set deadlock (#5010)
add c58941e1cc fix: close tmp fs and evict udf modules on
ExecutorManager.close() (#5046)
add 30b666eacd fix: assert equal-length worker lists in OneToOne
ChannelConfig (#5031)
add 87eb240ad1 fix: reject non-standard Int bit-widths in ArrowUtils
(#5030)
add bb6b52ba74 fix: reset iteration cursor in OneOnEach.initialize (#5028)
add ac55403592 fix: require non-null decodingMethod in
URLFetcherOpDesc.sourceSchema (#5048)
add 8c077140af fix: return None from getWorkerIndex for non-worker actor
IDs (#5006)
add 09828ea954 feat(k8s): use Lakekeeper as the Iceberg Catalog in the
Kubernetes deployment (#4275)
add 6538e20d7e feat: add eye icon tip to empty result messages (#5061)
add a00e9df405 chore(deps): bump fast-uri from 3.1.0 to 3.1.2 in /frontend
(#5063)
add 7bb102e8fe chore(deps): bump @babel/plugin-transform-modules-systemjs
from 7.29.0 to 7.29.4 in /frontend (#5062)
add 9ba490eea3 feat: add state materialization across regions (#4490)
add 425b589f8d Merge remote-tracking branch 'origin/main' into
xinyuan-loop-feb
No new revisions were added by this update.
Summary of changes:
.asf.yaml | 59 +-
.github/labeler.yml | 8 +-
.github/workflows/auto-queue.yml | 335 --------
.github/workflows/build-and-push-images.yml | 6 +-
.github/workflows/build.yml | 166 +++-
.github/workflows/check-header.yml | 1 +
.github/workflows/comment-commands.yml | 167 ++++
.github/workflows/lint-pr.yml | 5 +
.github/workflows/required-checks.yml | 5 +-
.github/workflows/take-commands.yml | 85 --
.gitignore | 6 +
bin/frontend-dev.sh => .jvmopts | 13 +-
.run/ComputingUnitMaster.run.xml | 1 +
.run/ComputingUnitWorker.run.xml | 1 +
AGENTS.md | 12 +-
LICENSE | 9 +-
access-control-service/LICENSE-binary | 5 +-
amber/LICENSE-binary-java | 5 +-
amber/LICENSE-binary-python | 26 +-
amber/build.sbt | 10 +-
amber/operator-requirements.txt | 4 +-
amber/{src/main/python => }/pyproject.toml | 20 +-
amber/requirements.txt | 1 -
.../handlers/control/assign_port_handler.py | 6 +-
.../core/architecture/managers/executor_manager.py | 16 +-
.../core/architecture/packaging/output_manager.py | 87 +-
amber/src/main/python/core/models/operator.py | 4 +-
amber/src/main/python/core/python_worker.py | 4 +-
.../main/python/core/runnables/data_processor.py | 105 +--
amber/src/main/python/core/runnables/heartbeat.py | 4 +-
.../main/python/core/runnables/network_receiver.py | 2 +-
.../input_port_materialization_reader_runnable.py | 37 +-
...t_input_port_materialization_reader_runnable.py | 190 -----
.../main/python/core/storage/vfs_uri_factory.py | 16 +-
.../main/python/core/util/{thread => }/atomic.py | 2 +-
.../core/util/{protocol => }/base_protocols.py | 0
.../main/python/core/util/buffer/buffer_base.py | 2 +-
.../linked_blocking_multi_queue.py | 2 +-
.../core/util/customized_queue/queue_base.py | 2 +-
.../__init__.py => expression_evaluator.py} | 0
.../src/main/python/core/util/operator/__init__.py | 16 -
.../python/core/util/{runnable => }/runnable.py | 0
.../stoppable/stoppable_queue_blocking_thread.py | 4 +-
amber/src/main/python/core/util/thread/__init__.py | 16 -
.../__init__.py => virtual_identity.py} | 17 +
.../architecture/common/ExecutorDeployment.scala | 10 +-
...ice.scala => PekkoActorRefMappingService.scala} | 2 +-
...aActorService.scala => PekkoActorService.scala} | 2 +-
...ice.scala => PekkoMessageTransferService.scala} | 6 +-
.../engine/architecture/common/WorkflowActor.scala | 10 +-
.../controller/ControllerProcessor.scala | 20 +-
.../controller/ControllerTimerService.scala | 6 +-
.../deploysemantics/deploystrategy/OneOnEach.scala | 1 +
.../messaginglayer/AmberFIFOChannel.scala | 6 +-
.../messaginglayer/OutputManager.scala | 75 +-
.../messaginglayer/WorkerTimerService.scala | 4 +-
.../scheduling/CostBasedScheduleGenerator.scala | 8 +-
.../ExpansionGreedyScheduleGenerator.scala | 4 +-
.../scheduling/RegionExecutionCoordinator.scala | 39 +-
.../scheduling/WorkflowExecutionCoordinator.scala | 10 +-
.../scheduling/config/ChannelConfig.scala | 5 +
.../scheduling/config/LinkConfig.scala | 7 +-
.../scheduling/config/PortConfig.scala | 10 +-
.../engine/architecture/worker/DataProcessor.scala | 3 +-
.../InputPortMaterializationReaderThread.scala | 53 +-
...d.scala => OutputPortStorageWriterThread.scala} | 40 +-
.../worker/managers/SerializationManager.scala | 8 +-
.../worker/promisehandlers/AssignPortHandler.scala | 4 +-
.../InitializeExecutorHandler.scala | 8 +-
.../promisehandlers/UpdateExecutorHandler.scala | 8 +-
.../texera/amber/engine/common/AmberRuntime.scala | 10 +-
.../pythonvirtualenvironment/PveManager.scala | 310 ++++++-
.../pythonvirtualenvironment/PveResource.scala | 49 +-
.../PveWebsocketResource.scala | 30 +-
.../org/apache/texera/workflow/LogicalLink.scala | 13 +
.../e2e/ReconfigurationIntegrationSpec.scala | 64 +-
.../IcebergRestCatalogIntegrationSpec.scala | 82 ++
.../handlers/control/test_debug_command_handler.py | 0
.../control/test_evaluate_expression_handler.py | 0
.../control/test_replay_current_tuple_handler.py | 0
.../control/test_update_executor_handler.py | 0
.../managers/test_console_message_manager.py | 0
.../architecture/managers/test_debug_manager.py | 0
.../test_embedded_control_message_manager.py | 0
.../managers/test_exception_manager.py | 0
.../architecture/managers/test_executor_manager.py | 40 +-
.../architecture/managers/test_pause_manager.py | 0
.../architecture/managers/test_state_manager.py | 0
.../managers/test_state_processing_manager.py | 0
.../managers/test_statistics_manager.py | 0
.../managers/test_tuple_processing_manager.py | 0
.../architecture/packaging/test_output_manager.py | 107 +++
.../packaging/test_state_materialization_e2e.py | 258 ++++++
.../core/architecture/rpc/test_async_rpc_client.py | 0
.../sendsemantics/test_partitioners.py | 0
.../python/core/models/schema/test_schema.py | 0
.../python/core/models/test_operator.py | 25 +-
.../python/core/models/test_state.py | 0
.../python/core/models/test_table.py | 0
.../python/core/models/test_tuple.py | 0
.../python/core/models/type/test_large_binary.py | 0
.../python/core/proxy/test_proxy_client.py | 4 +-
.../python/core/proxy/test_proxy_server.py | 2 +-
.../python/core/runnables/test_console_message.py | 0
.../python/core/runnables/test_data_processor.py | 207 +++++
.../python/core/runnables/test_heartbeat.py | 0
.../python/core/runnables/test_main_loop.py | 137 ++++
.../python/core/runnables/test_network_receiver.py | 0
.../python/core/runnables/test_network_sender.py | 0
.../core/storage/iceberg/test_iceberg_document.py | 45 +-
.../test_iceberg_rest_catalog_integration.py | 70 ++
.../storage/iceberg/test_iceberg_utils_catalog.py | 0
.../iceberg/test_iceberg_utils_large_binary.py | 0
...t_input_port_materialization_reader_runnable.py | 99 +++
.../python/core/storage/test_document_factory.py | 0
amber/src/test/python/core/test_python_worker.py | 125 +++
.../util/console_message/test_replace_print.py | 0
.../core/util/customized_queue/test_inner.py | 0
.../test_linked_blocking_multi_queue.py | 0
.../python/core/util}/test_atomic.py | 28 +-
.../python/core/util}/test_expression_evaluator.py | 2 +-
.../python/core/util}/test_virtual_identity.py | 23 +
.../pytexera/storage/test_dataset_file_document.py | 0
.../storage/test_large_binary_input_stream.py | 0
.../pytexera/storage/test_large_binary_manager.py | 0
.../storage/test_large_binary_output_stream.py | 0
.../udf/examples/test_count_batch_operator.py | 2 +-
.../pytexera/udf/examples/test_echo_operator.py | 2 +-
.../udf/examples/test_echo_table_operator.py | 2 +-
.../udf/examples/test_generator_operator_binary.py | 2 +-
.../examples/test_generator_operator_integer.py | 2 +-
.../deploystrategy/DeployStrategiesSpec.scala | 10 +-
.../logreplay/LogreplayPrimitivesSpec.scala | 2 +-
.../messaginglayer/AmberFIFOChannelSpec.scala | 7 +-
.../messaginglayer/CongestionControlSpec.scala | 2 +-
.../scheduling/RegionCoordinatorTestSupport.scala | 10 +-
.../RegionExecutionCoordinatorSpec.scala | 6 +-
.../WorkflowExecutionCoordinatorSpec.scala | 2 +-
.../scheduling/config/ChannelConfigSpec.scala | 41 +-
.../scheduling/config/LinkConfigSpec.scala | 31 +-
.../partitioners/NetworkOutputBufferSpec.scala | 274 +++++++
.../engine/architecture/worker/WorkerSpec.scala | 2 +-
.../OutputPortStorageWriterThreadSpec.scala | 151 ++++
.../engine/common/CheckpointSubsystemSpec.scala | 2 +-
.../amber/engine/e2e/DataProcessingSpec.scala | 2 +-
.../apache/texera/amber/engine/e2e/PauseSpec.scala | 2 +-
.../amber/engine/e2e/ReconfigurationSpec.scala | 2 +-
.../engine/faulttolerance/CheckpointSpec.scala | 2 +-
.../amber/engine/faulttolerance/LoggingSpec.scala | 2 +-
.../pythonvirtualenvironment/PveResourceSpec.scala | 74 +-
.../apache/texera/workflow/LogicalLinkSpec.scala | 291 +++++++
.../texera/workflow/WorkflowCompilerSpec.scala | 212 +++++
...quirements.txt => system-requirements-lock.txt} | 103 ++-
bin/access-control-service.dockerfile | 11 +-
bin/agent-service.dockerfile | 5 +
bin/computing-unit-master.dockerfile | 11 +-
bin/computing-unit-worker.dockerfile | 11 +-
bin/config-service.dockerfile | 11 +-
bin/file-service.dockerfile | 11 +-
bin/fix-format.sh | 11 +-
bin/k8s/Chart.yaml | 5 +
bin/k8s/files/texera_lakekeeper.sql | 1 +
bin/k8s/templates/external-names.yaml | 8 +-
bin/k8s/templates/lakekeeper-init-job.yaml | 137 ++++
.../templates/postgresql-init-script-config.yaml | 6 +
bin/k8s/templates/webserver-deployment.yaml | 11 +
...workflow-computing-unit-manager-deployment.yaml | 38 +-
bin/k8s/values.yaml | 32 +
bin/texera-web-application.dockerfile | 11 +-
bin/workflow-compiling-service.dockerfile | 11 +-
...flow-computing-unit-managing-service.dockerfile | 11 +-
build.sbt | 27 +-
codecov.yml | 9 +
common/config/src/main/resources/storage.conf | 3 -
.../config/{AkkaConfig.scala => PekkoConfig.scala} | 4 +-
common/dao/build.sbt | 3 +-
.../scala/org/apache/texera/dao/SiteSettings.scala | 57 ++
.../scala/org/apache/texera/dao/SqlServer.scala | 50 +-
.../scala/org/apache/texera/dao/MockTexeraDB.scala | 1 -
.../org/apache/texera/dao/SiteSettingsSpec.scala | 45 ++
.../org/apache/texera/dao/SqlServerSpec.scala | 234 ++++++
.../texera/amber/pybuilder/BoundaryValidator.scala | 52 +-
.../amber/pybuilder/EncodableInspector.scala | 56 +-
.../amber/pybuilder/PythonTemplateBuilder.scala | 336 ++++----
.../pybuilder/PythonTemplateBuilderApiSpec.scala | 247 ++++++
.../pybuilder/PythonTemplateBuilderSpec.scala | 50 +-
common/workflow-core/build.sbt | 2 +-
.../texera/amber/core/storage/VFSURIFactory.scala | 21 +-
.../texera/amber/core/workflow/PartitionInfo.scala | 1 +
.../org/apache/texera/amber/util/ArrowUtils.scala | 41 +-
.../texera/amber/util/VirtualIdentityUtils.scala | 7 +-
.../amber/util/serde/GlobalPortIdentitySerde.scala | 19 +-
.../amber/core/storage/VFSURIFactorySpec.scala | 23 +-
.../amber/core/workflow/PartitionInfoSpec.scala | 22 +-
.../result/iceberg/IcebergDocumentSpec.scala | 10 +-
.../result/iceberg/IcebergTableStatsSpec.scala | 22 +-
.../apache/texera/amber/util/ArrowUtilsSpec.scala | 40 +-
.../amber/util/VirtualIdentityUtilsSpec.scala | 21 +-
.../amber/util/serde/PortIdentitySerdeSpec.scala | 320 ++++++++
.../operator/source/fetcher/URLFetcherOpDesc.scala | 4 +
.../source/scan/csv/CSVScanSourceOpDesc.scala | 7 +-
.../source/scan/csv/CSVScanSourceOpExec.scala | 46 +-
.../source/scan/json/JSONLScanSourceOpExec.scala | 3 +-
.../amber/operator/source/scan/json/JSONUtil.scala | 72 --
.../visualization/DotPlot/DotPlotOpDesc.scala | 1 -
.../IcicleChart/IcicleChartOpDesc.scala | 1 -
.../ImageViz/ImageVisualizerOpDesc.scala | 1 -
.../ScatterMatrixChartOpDesc.scala | 1 -
.../visualization/barChart/BarChartOpDesc.scala | 1 -
.../boxViolinPlot/BoxViolinPlotOpDesc.scala | 1 -
.../bubbleChart/BubbleChartOpDesc.scala | 1 -
.../candlestickChart/CandlestickChartOpDesc.scala | 1 -
.../ContinuousErrorBandsOpDesc.scala | 1 -
.../contourPlot/ContourPlotOpDesc.scala | 1 -
.../dumbbellPlot/DumbbellPlotOpDesc.scala | 1 -
.../FigureFactoryTableOpDesc.scala | 1 -
.../filledAreaPlot/FilledAreaPlotOpDesc.scala | 1 -
.../funnelPlot/FunnelPlotOpDesc.scala | 1 -
.../ganttChart/GanttChartOpDesc.scala | 1 -
.../visualization/heatMap/HeatMapOpDesc.scala | 1 -
.../hierarchychart/HierarchyChartOpDesc.scala | 1 -
.../histogram/HistogramChartOpDesc.scala | 1 -
.../visualization/lineChart/LineChartOpDesc.scala | 4 +-
.../networkGraph/NetworkGraphOpDesc.scala | 1 -
.../visualization/pieChart/PieChartOpDesc.scala | 1 -
.../quiverPlot/QuiverPlotOpDesc.scala | 1 -
.../sankeyDiagram/SankeyDiagramOpDesc.scala | 1 -
.../scatter3DChart/Scatter3dChartOpDesc.scala | 1 -
.../scatterplot/ScatterplotOpDesc.scala | 1 -
.../tablesChart/TablesPlotOpDesc.scala | 1 -
.../ternaryPlot/TernaryPlotOpDesc.scala | 1 -
.../volcanoPlot/VolcanoPlotOpDesc.scala | 1 -
.../waterfallChart/WaterfallChartOpDesc.scala | 1 -
.../source/fetcher/URLFetcherOpDescSpec.scala | 17 +-
.../source/fetcher/URLFetcherOpExecSpec.scala | 3 -
.../source/scan/csv/CSVScanSourceOpExecSpec.scala | 110 +++
.../lineChart/LineChartOpDescSpec.scala | 36 +-
computing-unit-managing-service/LICENSE-binary | 5 +-
config-service/LICENSE-binary | 5 +-
docs/_index.md | 28 +
docs/concepts/_index.md | 38 +
docs/contribution-guidelines/_index.md | 160 ++++
.../apache-license-header.md | 32 +
.../guide-for-developers.md | 357 ++++++++
.../guide-to-frontend-development.md | 52 ++
.../guide-to-implement-java-operator.md | 283 +++++++
.../guide-to-implement-python-operator.md | 91 +++
.../making-contributions.md | 12 +
.../micro-services-local-dev.md | 58 ++
.../release-email-template.md | 90 +++
docs/examples/_index.md | 58 ++
docs/getting-started/AccessLogin.md | 39 +
docs/getting-started/_index.md | 20 +
docs/getting-started/install-texera.md | 10 +
.../getting-started/installing-using-docker.md | 82 +-
docs/getting-started/run-on-kubernetes.md | 137 ++++
docs/getting-started/ui-overview.md | 32 +
docs/overview.md | 43 +
docs/reference/_index.md | 62 ++
docs/reference/configuration.md | 5 +
docs/reference/engine.md | 5 +
docs/reference/frontend.md | 5 +
docs/reference/operators/_index.md | 47 ++
docs/reference/operators/control-block/_index.md | 18 +
docs/reference/operators/control-block/if.md | 22 +
docs/reference/operators/control-block/sleep.md | 21 +
docs/reference/operators/data-cleaning/_index.md | 28 +
.../operators/data-cleaning/aggregate/_index.md | 17 +
.../operators/data-cleaning/aggregate/aggregate.md | 25 +
docs/reference/operators/data-cleaning/distinct.md | 15 +
docs/reference/operators/data-cleaning/filter.md | 24 +
.../operators/data-cleaning/join/_index.md | 19 +
.../data-cleaning/join/cartesian-product.md | 15 +
.../operators/data-cleaning/join/hash-join.md | 23 +
.../operators/data-cleaning/join/interval-join.md | 26 +
docs/reference/operators/data-cleaning/limit.md | 21 +
.../operators/data-cleaning/projection.md | 24 +
.../operators/data-cleaning/set/_index.md | 20 +
.../operators/data-cleaning/set/difference.md | 15 +
.../operators/data-cleaning/set/intersect.md | 15 +
.../data-cleaning/set/symmetricdifference.md | 15 +
.../reference/operators/data-cleaning/set/union.md | 15 +
.../operators/data-cleaning/sort/_index.md | 19 +
.../data-cleaning/sort/sort-partitions.md | 23 +
.../reference/operators/data-cleaning/sort/sort.md | 23 +
.../data-cleaning/sort/stable-merge-sort.md | 23 +
.../operators/data-cleaning/type-casting.md | 23 +
docs/reference/operators/data-input/_index.md | 24 +
.../operators/data-input/arrow-file-scan.md | 23 +
.../operators/data-input/csv-file-scan.md | 26 +
.../operators/data-input/csvold-file-scan.md | 26 +
docs/reference/operators/data-input/file-lister.md | 21 +
.../operators/data-input/file-scan-from-input.md | 27 +
docs/reference/operators/data-input/file-scan.md | 28 +
.../operators/data-input/jsonl-file-scan.md | 25 +
docs/reference/operators/data-input/text-input.md | 25 +
.../operators/database-connector/_index.md | 19 +
.../database-connector/asterixdb-source.md | 45 ++
.../operators/database-connector/mysql-source.md | 36 +
.../database-connector/postgresql-source.md | 36 +
docs/reference/operators/external-api/_index.md | 20 +
.../operators/external-api/reddit-search.md | 25 +
.../twitter-full-archive-search-api.md | 27 +
.../operators/external-api/twitter-search-api.md | 25 +
.../operators/external-api/url-fetcher.md | 22 +
.../reference/operators/machine-learning/_index.md | 17 +
.../machine-learning/advanced-sklearn/_index.md | 20 +
.../advanced-sklearn/knn-classifier.md | 23 +
.../advanced-sklearn/knn-regressor.md | 23 +
.../advanced-sklearn/svm-classifier.md | 23 +
.../advanced-sklearn/svm-regressor.md | 23 +
.../machine-learning/hugging-face/_index.md | 20 +
.../hugging-face-iris-logistic-regression.md | 24 +
.../hugging-face-sentiment-analysis.md | 24 +
.../hugging-face/hugging-face-spam-detection.md | 23 +
.../hugging-face-text-summarization.md | 22 +
.../machine-learning-general/_index.md | 17 +
.../machine-learning-scorer.md | 25 +
.../operators/machine-learning/sklearn/_index.md | 48 ++
.../machine-learning/sklearn/adaptive-boosting.md | 24 +
.../operators/machine-learning/sklearn/bagging.md | 24 +
.../sklearn/bernoulli-naive-bayes.md | 24 +
.../sklearn/complement-naive-bayes.md | 24 +
.../machine-learning/sklearn/decision-tree.md | 24 +
.../machine-learning/sklearn/dummy-classifier.md | 24 +
.../machine-learning/sklearn/extra-tree.md | 24 +
.../machine-learning/sklearn/extra-trees.md | 24 +
.../sklearn/gaussian-naive-bayes.md | 24 +
.../machine-learning/sklearn/gradient-boosting.md | 24 +
.../sklearn/k-nearest-neighbors.md | 24 +
.../machine-learning/sklearn/linear-perceptron.md | 24 +
.../machine-learning/sklearn/linear-regression.md | 22 +
.../sklearn/linear-support-vector-machine.md | 24 +
.../logistic-regression-cross-validation.md | 24 +
.../sklearn/logistic-regression.md | 24 +
.../sklearn/multi-layer-perceptron.md | 24 +
.../sklearn/multinomial-naive-bayes.md | 24 +
.../machine-learning/sklearn/nearest-centroid.md | 24 +
.../machine-learning/sklearn/passive-aggressive.md | 24 +
.../sklearn/probability-calibration.md | 24 +
.../machine-learning/sklearn/random-forest.md | 24 +
.../sklearn/ridge-regression-cross-validation.md | 24 +
.../machine-learning/sklearn/ridge-regression.md | 24 +
.../machine-learning/sklearn/sklearn-prediction.md | 23 +
.../machine-learning/sklearn/sklearn-testing.md | 23 +
.../sklearn/sklearn-training/_index.md | 42 +
.../sklearn-training/training-adaptive-boosting.md | 24 +
.../sklearn-training/training-bagging-training.md | 24 +
.../training-bernoulli-naive-bayes.md | 24 +
.../training-complement-naive-bayes.md | 24 +
.../sklearn-training/training-decision-tree.md | 24 +
.../sklearn-training/training-dummy-classifier.md | 24 +
.../sklearn-training/training-extra-tree.md | 24 +
.../sklearn-training/training-extra-trees.md | 24 +
.../training-gaussian-naive-bayes.md | 24 +
.../sklearn-training/training-gradient-boosting.md | 24 +
.../training-k-nearest-neighbors.md | 24 +
.../sklearn-training/training-linear-perceptron.md | 24 +
.../sklearn-training/training-linear-regression.md | 24 +
.../training-linear-support-vector-machine.md | 24 +
...raining-logistic-regression-cross-validation.md | 24 +
.../training-logistic-regression.md | 24 +
.../training-multi-layer-perceptron.md | 24 +
.../training-multinomial-naive-bayes.md | 24 +
.../sklearn-training/training-nearest-centroid.md | 24 +
.../training-passive-aggressive.md | 24 +
.../training-probability-calibration.md | 24 +
.../sklearn-training/training-random-forest.md | 24 +
.../training-ridge-regression-cross-validation.md | 24 +
.../sklearn-training/training-ridge-regression.md | 24 +
.../training-stochastic-gradient-descent.md | 24 +
.../training-support-vector-machine.md | 24 +
.../sklearn/stochastic-gradient-descent.md | 24 +
.../sklearn/support-vector-machine.md | 24 +
docs/reference/operators/output-modes.md | 24 +
docs/reference/operators/parameters/_index.md | 17 +
.../parameters/sklearn-advanced-knn-parameters.md | 27 +
.../parameters/sklearn-advanced-svc-parameters.md | 26 +
.../parameters/sklearn-advanced-svr-parameters.md | 30 +
docs/reference/operators/search/_index.md | 20 +
.../operators/search/dictionary-matcher.md | 24 +
docs/reference/operators/search/keyword-search.md | 22 +
.../operators/search/regular-expression.md | 23 +
.../reference/operators/search/substring-search.md | 23 +
.../operators/user-defined-functions/_index.md | 16 +
.../user-defined-functions/java/_index.md | 17 +
.../user-defined-functions/java/java-udf.md | 48 ++
.../python/1-out-python-udf.md | 40 +
.../python/2-in-python-udf.md | 56 ++
.../user-defined-functions/python/_index.md | 21 +
.../python/python-lambda-function.md | 24 +
.../python/python-table-reducer.md | 24 +
.../user-defined-functions/python/python-udf.md | 56 ++
.../user-defined-functions/r/1-out-r-udf.md | 43 +
.../operators/user-defined-functions/r/_index.md | 18 +
.../operators/user-defined-functions/r/r-udf.md | 44 +
docs/reference/operators/utilities/_index.md | 20 +
.../operators/utilities/random-k-sampling.md | 21 +
.../operators/utilities/reservoir-sampling.md | 21 +
docs/reference/operators/utilities/split.md | 24 +
.../reference/operators/utilities/unnest-string.md | 23 +
docs/reference/operators/visualization/_index.md | 26 +
.../operators/visualization/advanced/_index.md | 18 +
.../visualization/advanced/choropleth-map.md | 22 +
.../visualization/advanced/scatter3d-chart.md | 23 +
.../operators/visualization/basic/_index.md | 32 +
.../operators/visualization/basic/bar-chart.md | 25 +
.../operators/visualization/basic/bubble-chart.md | 25 +
.../operators/visualization/basic/dot-plot.md | 21 +
.../operators/visualization/basic/dumbbell-plot.md | 28 +
.../visualization/basic/figure-factory-table.md | 25 +
.../visualization/basic/filled-area-plot.md | 26 +
.../operators/visualization/basic/gantt-chart.md | 25 +
.../visualization/basic/hierarchy-chart.md | 24 +
.../operators/visualization/basic/icicle-chart.md | 23 +
.../operators/visualization/basic/line-chart.md | 28 +
.../operators/visualization/basic/pie-chart.md | 22 +
.../operators/visualization/basic/range-slider.md | 23 +
.../visualization/basic/sankey-diagram.md | 23 +
.../operators/visualization/basic/scatter-plot.md | 27 +
.../operators/visualization/basic/tables-plot.md | 22 +
.../visualization/basic/time-series-plot.md | 26 +
.../operators/visualization/financial/_index.md | 21 +
.../visualization/financial/bullet-chart.md | 26 +
.../visualization/financial/candlestick-chart.md | 25 +
.../visualization/financial/funnel-plot.md | 23 +
.../visualization/financial/gauge-chart.md | 26 +
.../visualization/financial/waterfall-chart.md | 22 +
.../operators/visualization/media/_index.md | 20 +
.../visualization/media/html-visualizer.md | 21 +
.../visualization/media/image-visualizer.md | 21 +
.../visualization/media/url-visualizer.md | 21 +
.../operators/visualization/media/word-cloud.md | 22 +
.../operators/visualization/nested-table.md | 24 +
.../operators/visualization/scientific/_index.md | 30 +
.../visualization/scientific/carpet-plot.md | 23 +
.../visualization/scientific/contour-plot.md | 26 +
.../visualization/scientific/dendrogram.md | 24 +
.../operators/visualization/scientific/heatmap.md | 23 +
.../visualization/scientific/network-graph.md | 23 +
.../scientific/parallel-coordinates-plot.md | 22 +
.../visualization/scientific/polar-chart.md | 22 +
.../visualization/scientific/quiver-plot.md | 24 +
.../visualization/scientific/radar-chart.md | 23 +
.../visualization/scientific/radar-plot.md | 28 +
.../visualization/scientific/ternary-contour.md | 24 +
.../visualization/scientific/ternary-plot.md | 25 +
.../visualization/scientific/volcano-plot.md | 22 +
.../visualization/scientific/wind-rose-chart.md | 23 +
.../operators/visualization/statistical/_index.md | 24 +
.../visualization/statistical/boxviolin-plot.md | 24 +
.../statistical/continuous-error-bands.md | 31 +
.../empirical-cumulative-distribution-plot.md | 28 +
.../visualization/statistical/histogram.md | 25 +
.../visualization/statistical/histogram2d.md | 25 +
.../statistical/scatter-matrix-chart.md | 22 +
.../visualization/statistical/strip-chart.md | 24 +
.../visualization/statistical/tree-plot.md | 21 +
docs/reference/project-structure.md | 5 +
docs/reference/storage.md | 5 +
SECURITY.md => docs/security/_index.md | 92 +--
docs/tutorials/_index.md | 68 ++
docs/tutorials/create-dataset-upload-data.md | 35 +
docs/tutorials/guide-for-how-to-use-texera.md | 46 ++
docs/tutorials/guide-to-enable-llm-agent.md | 96 +++
docs/tutorials/guide-to-launch-lakekeeper.md | 119 +++
docs/tutorials/guide-to-use-python-udf.md | 164 ++++
docs/tutorials/migrate-jupyter-notebook.md | 190 +++++
file-service/LICENSE-binary | 5 +-
.../texera/service/resource/DatasetResource.scala | 16 +-
frontend/.gitignore | 3 +
frontend/LICENSE-binary | 10 +-
frontend/angular.json | 29 +-
frontend/package.json | 15 +-
.../preset-wrapper.component.spec.ts | 578 +++++++------
.../user/config/user-config.service.spec.ts | 317 +++++---
.../admin/settings/admin-settings.component.html | 33 +
.../admin/settings/admin-settings.component.ts | 37 +-
.../component/dashboard.component.spec.ts | 20 +-
.../user/list-item/list-item.component.spec.ts | 9 +-
.../user-computing-unit.component.spec.ts | 5 +-
.../user-project-list-item.component.spec.ts | 39 +-
.../user/user-quota/user-quota.component.spec.ts | 5 +-
.../user-workflow-list-item.component.spec.ts | 42 +-
.../user-workflow/user-workflow.component.html | 1 -
.../user-workflow/user-workflow.component.spec.ts | 25 +-
.../service/user/download/download.service.spec.ts | 365 +++++----
.../service/user/download/download.service.ts | 2 -
.../annotation-suggestion.component.spec.ts | 87 ++
.../breakpoint-condition-input.component.spec.ts | 11 +-
.../code-debugger.component.spec.ts | 29 +-
.../code-editor.component.spec.ts | 169 +++-
.../codearea-custom-template.component.spec.ts | 11 +-
.../left-panel/settings/settings.component.spec.ts | 172 ++++
.../time-travel/time-travel.component.spec.ts | 12 +-
.../versions-list/versions-list.component.spec.ts | 12 +-
.../component/menu/menu.component.spec.ts | 821 ++++++++++++-------
.../computing-unit-selection.component.html | 116 ++-
.../computing-unit-selection.component.ts | 266 ++++--
.../operator-property-edit-frame.component.spec.ts | 15 +-
.../result-panel/result-panel.component.html | 1 +
.../result-table-frame.component.html | 1 +
.../result-table-frame.component.spec.ts | 19 +-
.../context-menu/context-menu.component.spec.ts | 14 +-
.../workflow-editor.component.spec.ts | 35 +-
.../component/workspace.component.spec.ts | 344 ++++++++
.../service/drag-drop/drag-drop.service.spec.ts | 172 ++--
.../operator-debug/udf-debug.service.spec.ts | 16 +-
.../service/preset/preset.service.spec.ts | 870 ++++++++++----------
.../virtual-environment.service.ts | 20 +-
.../workflow-result-export.service.spec.ts | 10 +-
.../workflow-result.service.spec.ts | 8 +-
frontend/src/jsdom-svg-polyfill.ts | 27 +-
frontend/src/styles.scss | 69 +-
frontend/src/tsconfig.spec.json | 43 +-
frontend/vitest.browser.config.ts | 59 ++
frontend/vitest.config.ts | 11 +
frontend/yarn.lock | 897 ++++++++++++++++-----
licenses-3rd-party-code/angular.md | 9 +
.../mbknor-jackson-jsonschema.txt | 4 +-
licenses-3rd-party-code/monaco-languageclient.txt | 9 +
project/JdkOptions.scala | 57 ++
workflow-compiling-service/LICENSE-binary | 5 +-
523 files changed, 16808 insertions(+), 3700 deletions(-)
delete mode 100644 .github/workflows/auto-queue.yml
create mode 100644 .github/workflows/comment-commands.yml
delete mode 100644 .github/workflows/take-commands.yml
copy bin/frontend-dev.sh => .jvmopts (56%)
rename amber/{src/main/python => }/pyproject.toml (50%)
delete mode 100644
amber/src/main/python/core/storage/runnables/test_input_port_materialization_reader_runnable.py
rename amber/src/main/python/core/util/{thread => }/atomic.py (97%)
rename amber/src/main/python/core/util/{protocol => }/base_protocols.py (100%)
rename amber/src/main/python/core/util/{expression_evaluator/__init__.py =>
expression_evaluator.py} (100%)
delete mode 100644 amber/src/main/python/core/util/operator/__init__.py
rename amber/src/main/python/core/util/{runnable => }/runnable.py (100%)
delete mode 100644 amber/src/main/python/core/util/thread/__init__.py
rename amber/src/main/python/core/util/{virtual_identity/__init__.py =>
virtual_identity.py} (84%)
rename
amber/src/main/scala/org/apache/texera/amber/engine/architecture/common/{AkkaActorRefMappingService.scala
=> PekkoActorRefMappingService.scala} (98%)
rename
amber/src/main/scala/org/apache/texera/amber/engine/architecture/common/{AkkaActorService.scala
=> PekkoActorService.scala} (96%)
rename
amber/src/main/scala/org/apache/texera/amber/engine/architecture/common/{AkkaMessageTransferService.scala
=> PekkoMessageTransferService.scala} (98%)
rename
amber/src/main/scala/org/apache/texera/amber/engine/architecture/worker/managers/{OutputPortResultWriterThread.scala
=> OutputPortStorageWriterThread.scala} (52%)
create mode 100644
amber/src/test/integration/org/apache/texera/amber/storage/iceberg/IcebergRestCatalogIntegrationSpec.scala
rename amber/src/{main =>
test}/python/core/architecture/handlers/control/test_debug_command_handler.py
(100%)
rename amber/src/{main =>
test}/python/core/architecture/handlers/control/test_evaluate_expression_handler.py
(100%)
rename amber/src/{main =>
test}/python/core/architecture/handlers/control/test_replay_current_tuple_handler.py
(100%)
rename amber/src/{main =>
test}/python/core/architecture/handlers/control/test_update_executor_handler.py
(100%)
rename amber/src/{main =>
test}/python/core/architecture/managers/test_console_message_manager.py (100%)
rename amber/src/{main =>
test}/python/core/architecture/managers/test_debug_manager.py (100%)
rename amber/src/{main =>
test}/python/core/architecture/managers/test_embedded_control_message_manager.py
(100%)
rename amber/src/{main =>
test}/python/core/architecture/managers/test_exception_manager.py (100%)
rename amber/src/{main =>
test}/python/core/architecture/managers/test_executor_manager.py (93%)
rename amber/src/{main =>
test}/python/core/architecture/managers/test_pause_manager.py (100%)
rename amber/src/{main =>
test}/python/core/architecture/managers/test_state_manager.py (100%)
rename amber/src/{main =>
test}/python/core/architecture/managers/test_state_processing_manager.py (100%)
rename amber/src/{main =>
test}/python/core/architecture/managers/test_statistics_manager.py (100%)
rename amber/src/{main =>
test}/python/core/architecture/managers/test_tuple_processing_manager.py (100%)
create mode 100644
amber/src/test/python/core/architecture/packaging/test_output_manager.py
create mode 100644
amber/src/test/python/core/architecture/packaging/test_state_materialization_e2e.py
rename amber/src/{main =>
test}/python/core/architecture/rpc/test_async_rpc_client.py (100%)
rename amber/src/{main =>
test}/python/core/architecture/sendsemantics/test_partitioners.py (100%)
rename amber/src/{main => test}/python/core/models/schema/test_schema.py (100%)
rename amber/src/{main => test}/python/core/models/test_operator.py (88%)
rename amber/src/{main => test}/python/core/models/test_state.py (100%)
rename amber/src/{main => test}/python/core/models/test_table.py (100%)
rename amber/src/{main => test}/python/core/models/test_tuple.py (100%)
rename amber/src/{main => test}/python/core/models/type/test_large_binary.py
(100%)
rename amber/src/{main => test}/python/core/proxy/test_proxy_client.py (98%)
rename amber/src/{main => test}/python/core/proxy/test_proxy_server.py (98%)
rename amber/src/{main => test}/python/core/runnables/test_console_message.py
(100%)
create mode 100644 amber/src/test/python/core/runnables/test_data_processor.py
rename amber/src/{main => test}/python/core/runnables/test_heartbeat.py (100%)
rename amber/src/{main => test}/python/core/runnables/test_main_loop.py (90%)
rename amber/src/{main => test}/python/core/runnables/test_network_receiver.py
(100%)
rename amber/src/{main => test}/python/core/runnables/test_network_sender.py
(100%)
rename amber/src/{main =>
test}/python/core/storage/iceberg/test_iceberg_document.py (91%)
create mode 100644
amber/src/test/python/core/storage/iceberg/test_iceberg_rest_catalog_integration.py
rename amber/src/{main =>
test}/python/core/storage/iceberg/test_iceberg_utils_catalog.py (100%)
rename amber/src/{main =>
test}/python/core/storage/iceberg/test_iceberg_utils_large_binary.py (100%)
create mode 100644
amber/src/test/python/core/storage/runnables/test_input_port_materialization_reader_runnable.py
copy amber/src/{main => test}/python/core/storage/test_document_factory.py
(100%)
create mode 100644 amber/src/test/python/core/test_python_worker.py
rename amber/src/{main =>
test}/python/core/util/console_message/test_replace_print.py (100%)
rename amber/src/{main =>
test}/python/core/util/customized_queue/test_inner.py (100%)
rename amber/src/{main =>
test}/python/core/util/customized_queue/test_linked_blocking_multi_queue.py
(100%)
rename amber/src/{main/python/core/util/thread =>
test/python/core/util}/test_atomic.py (75%)
rename amber/src/{main/python/core/util/expression_evaluator =>
test/python/core/util}/test_expression_evaluator.py (99%)
rename amber/src/{main/python/core/util/virtual_identity =>
test/python/core/util}/test_virtual_identity.py (83%)
rename amber/src/{main =>
test}/python/pytexera/storage/test_dataset_file_document.py (100%)
rename amber/src/{main =>
test}/python/pytexera/storage/test_large_binary_input_stream.py (100%)
rename amber/src/{main =>
test}/python/pytexera/storage/test_large_binary_manager.py (100%)
rename amber/src/{main =>
test}/python/pytexera/storage/test_large_binary_output_stream.py (100%)
rename amber/src/{main =>
test}/python/pytexera/udf/examples/test_count_batch_operator.py (98%)
rename amber/src/{main =>
test}/python/pytexera/udf/examples/test_echo_operator.py (95%)
rename amber/src/{main =>
test}/python/pytexera/udf/examples/test_echo_table_operator.py (95%)
rename amber/src/{main =>
test}/python/pytexera/udf/examples/test_generator_operator_binary.py (93%)
rename amber/src/{main =>
test}/python/pytexera/udf/examples/test_generator_operator_integer.py (93%)
create mode 100644
amber/src/test/scala/org/apache/texera/amber/engine/architecture/sendsemantics/partitioners/NetworkOutputBufferSpec.scala
create mode 100644
amber/src/test/scala/org/apache/texera/amber/engine/architecture/worker/managers/OutputPortStorageWriterThreadSpec.scala
create mode 100644
amber/src/test/scala/org/apache/texera/workflow/LogicalLinkSpec.scala
create mode 100644
amber/src/test/scala/org/apache/texera/workflow/WorkflowCompilerSpec.scala
copy amber/{requirements.txt => system-requirements-lock.txt} (57%)
create mode 120000 bin/k8s/files/texera_lakekeeper.sql
create mode 100644 bin/k8s/templates/lakekeeper-init-job.yaml
rename
common/config/src/main/scala/org/apache/texera/amber/config/{AkkaConfig.scala
=> PekkoConfig.scala} (90%)
create mode 100644
common/dao/src/main/scala/org/apache/texera/dao/SiteSettings.scala
create mode 100644
common/dao/src/test/scala/org/apache/texera/dao/SiteSettingsSpec.scala
create mode 100644
common/dao/src/test/scala/org/apache/texera/dao/SqlServerSpec.scala
create mode 100644
common/pybuilder/src/test/scala/org/apache/texera/amber/pybuilder/PythonTemplateBuilderApiSpec.scala
create mode 100644
common/workflow-core/src/test/scala/org/apache/texera/amber/util/serde/PortIdentitySerdeSpec.scala
delete mode 100644
common/workflow-operator/src/main/scala/org/apache/texera/amber/operator/source/scan/json/JSONUtil.scala
create mode 100644
common/workflow-operator/src/test/scala/org/apache/texera/amber/operator/source/scan/csv/CSVScanSourceOpExecSpec.scala
create mode 100644 docs/_index.md
create mode 100644 docs/concepts/_index.md
create mode 100644 docs/contribution-guidelines/_index.md
create mode 100644 docs/contribution-guidelines/apache-license-header.md
create mode 100644 docs/contribution-guidelines/guide-for-developers.md
create mode 100644
docs/contribution-guidelines/guide-to-frontend-development.md
create mode 100644
docs/contribution-guidelines/guide-to-implement-java-operator.md
create mode 100644
docs/contribution-guidelines/guide-to-implement-python-operator.md
create mode 100644 docs/contribution-guidelines/making-contributions.md
create mode 100644 docs/contribution-guidelines/micro-services-local-dev.md
create mode 100644 docs/contribution-guidelines/release-email-template.md
create mode 100644 docs/examples/_index.md
create mode 100644 docs/getting-started/AccessLogin.md
create mode 100644 docs/getting-started/_index.md
create mode 100644 docs/getting-started/install-texera.md
copy bin/single-node/README.md =>
docs/getting-started/installing-using-docker.md (69%)
create mode 100644 docs/getting-started/run-on-kubernetes.md
create mode 100644 docs/getting-started/ui-overview.md
create mode 100644 docs/overview.md
create mode 100644 docs/reference/_index.md
create mode 100644 docs/reference/configuration.md
create mode 100644 docs/reference/engine.md
create mode 100644 docs/reference/frontend.md
create mode 100644 docs/reference/operators/_index.md
create mode 100644 docs/reference/operators/control-block/_index.md
create mode 100644 docs/reference/operators/control-block/if.md
create mode 100644 docs/reference/operators/control-block/sleep.md
create mode 100644 docs/reference/operators/data-cleaning/_index.md
create mode 100644 docs/reference/operators/data-cleaning/aggregate/_index.md
create mode 100644
docs/reference/operators/data-cleaning/aggregate/aggregate.md
create mode 100644 docs/reference/operators/data-cleaning/distinct.md
create mode 100644 docs/reference/operators/data-cleaning/filter.md
create mode 100644 docs/reference/operators/data-cleaning/join/_index.md
create mode 100644
docs/reference/operators/data-cleaning/join/cartesian-product.md
create mode 100644 docs/reference/operators/data-cleaning/join/hash-join.md
create mode 100644 docs/reference/operators/data-cleaning/join/interval-join.md
create mode 100644 docs/reference/operators/data-cleaning/limit.md
create mode 100644 docs/reference/operators/data-cleaning/projection.md
create mode 100644 docs/reference/operators/data-cleaning/set/_index.md
create mode 100644 docs/reference/operators/data-cleaning/set/difference.md
create mode 100644 docs/reference/operators/data-cleaning/set/intersect.md
create mode 100644
docs/reference/operators/data-cleaning/set/symmetricdifference.md
create mode 100644 docs/reference/operators/data-cleaning/set/union.md
create mode 100644 docs/reference/operators/data-cleaning/sort/_index.md
create mode 100644
docs/reference/operators/data-cleaning/sort/sort-partitions.md
create mode 100644 docs/reference/operators/data-cleaning/sort/sort.md
create mode 100644
docs/reference/operators/data-cleaning/sort/stable-merge-sort.md
create mode 100644 docs/reference/operators/data-cleaning/type-casting.md
create mode 100644 docs/reference/operators/data-input/_index.md
create mode 100644 docs/reference/operators/data-input/arrow-file-scan.md
create mode 100644 docs/reference/operators/data-input/csv-file-scan.md
create mode 100644 docs/reference/operators/data-input/csvold-file-scan.md
create mode 100644 docs/reference/operators/data-input/file-lister.md
create mode 100644 docs/reference/operators/data-input/file-scan-from-input.md
create mode 100644 docs/reference/operators/data-input/file-scan.md
create mode 100644 docs/reference/operators/data-input/jsonl-file-scan.md
create mode 100644 docs/reference/operators/data-input/text-input.md
create mode 100644 docs/reference/operators/database-connector/_index.md
create mode 100644
docs/reference/operators/database-connector/asterixdb-source.md
create mode 100644 docs/reference/operators/database-connector/mysql-source.md
create mode 100644
docs/reference/operators/database-connector/postgresql-source.md
create mode 100644 docs/reference/operators/external-api/_index.md
create mode 100644 docs/reference/operators/external-api/reddit-search.md
create mode 100644
docs/reference/operators/external-api/twitter-full-archive-search-api.md
create mode 100644 docs/reference/operators/external-api/twitter-search-api.md
create mode 100644 docs/reference/operators/external-api/url-fetcher.md
create mode 100644 docs/reference/operators/machine-learning/_index.md
create mode 100644
docs/reference/operators/machine-learning/advanced-sklearn/_index.md
create mode 100644
docs/reference/operators/machine-learning/advanced-sklearn/knn-classifier.md
create mode 100644
docs/reference/operators/machine-learning/advanced-sklearn/knn-regressor.md
create mode 100644
docs/reference/operators/machine-learning/advanced-sklearn/svm-classifier.md
create mode 100644
docs/reference/operators/machine-learning/advanced-sklearn/svm-regressor.md
create mode 100644
docs/reference/operators/machine-learning/hugging-face/_index.md
create mode 100644
docs/reference/operators/machine-learning/hugging-face/hugging-face-iris-logistic-regression.md
create mode 100644
docs/reference/operators/machine-learning/hugging-face/hugging-face-sentiment-analysis.md
create mode 100644
docs/reference/operators/machine-learning/hugging-face/hugging-face-spam-detection.md
create mode 100644
docs/reference/operators/machine-learning/hugging-face/hugging-face-text-summarization.md
create mode 100644
docs/reference/operators/machine-learning/machine-learning-general/_index.md
create mode 100644
docs/reference/operators/machine-learning/machine-learning-general/machine-learning-scorer.md
create mode 100644 docs/reference/operators/machine-learning/sklearn/_index.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/adaptive-boosting.md
create mode 100644 docs/reference/operators/machine-learning/sklearn/bagging.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/bernoulli-naive-bayes.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/complement-naive-bayes.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/decision-tree.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/dummy-classifier.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/extra-tree.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/extra-trees.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/gaussian-naive-bayes.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/gradient-boosting.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/k-nearest-neighbors.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/linear-perceptron.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/linear-regression.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/linear-support-vector-machine.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/logistic-regression-cross-validation.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/logistic-regression.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/multi-layer-perceptron.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/multinomial-naive-bayes.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/nearest-centroid.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/passive-aggressive.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/probability-calibration.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/random-forest.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/ridge-regression-cross-validation.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/ridge-regression.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-prediction.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-testing.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/_index.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-adaptive-boosting.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-bagging-training.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-bernoulli-naive-bayes.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-complement-naive-bayes.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-decision-tree.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-dummy-classifier.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-extra-tree.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-extra-trees.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-gaussian-naive-bayes.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-gradient-boosting.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-k-nearest-neighbors.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-linear-perceptron.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-linear-regression.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-linear-support-vector-machine.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-logistic-regression-cross-validation.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-logistic-regression.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-multi-layer-perceptron.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-multinomial-naive-bayes.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-nearest-centroid.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-passive-aggressive.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-probability-calibration.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-random-forest.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-ridge-regression-cross-validation.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-ridge-regression.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-stochastic-gradient-descent.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/sklearn-training/training-support-vector-machine.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/stochastic-gradient-descent.md
create mode 100644
docs/reference/operators/machine-learning/sklearn/support-vector-machine.md
create mode 100644 docs/reference/operators/output-modes.md
create mode 100644 docs/reference/operators/parameters/_index.md
create mode 100644
docs/reference/operators/parameters/sklearn-advanced-knn-parameters.md
create mode 100644
docs/reference/operators/parameters/sklearn-advanced-svc-parameters.md
create mode 100644
docs/reference/operators/parameters/sklearn-advanced-svr-parameters.md
create mode 100644 docs/reference/operators/search/_index.md
create mode 100644 docs/reference/operators/search/dictionary-matcher.md
create mode 100644 docs/reference/operators/search/keyword-search.md
create mode 100644 docs/reference/operators/search/regular-expression.md
create mode 100644 docs/reference/operators/search/substring-search.md
create mode 100644 docs/reference/operators/user-defined-functions/_index.md
create mode 100644
docs/reference/operators/user-defined-functions/java/_index.md
create mode 100644
docs/reference/operators/user-defined-functions/java/java-udf.md
create mode 100644
docs/reference/operators/user-defined-functions/python/1-out-python-udf.md
create mode 100644
docs/reference/operators/user-defined-functions/python/2-in-python-udf.md
create mode 100644
docs/reference/operators/user-defined-functions/python/_index.md
create mode 100644
docs/reference/operators/user-defined-functions/python/python-lambda-function.md
create mode 100644
docs/reference/operators/user-defined-functions/python/python-table-reducer.md
create mode 100644
docs/reference/operators/user-defined-functions/python/python-udf.md
create mode 100644
docs/reference/operators/user-defined-functions/r/1-out-r-udf.md
create mode 100644 docs/reference/operators/user-defined-functions/r/_index.md
create mode 100644 docs/reference/operators/user-defined-functions/r/r-udf.md
create mode 100644 docs/reference/operators/utilities/_index.md
create mode 100644 docs/reference/operators/utilities/random-k-sampling.md
create mode 100644 docs/reference/operators/utilities/reservoir-sampling.md
create mode 100644 docs/reference/operators/utilities/split.md
create mode 100644 docs/reference/operators/utilities/unnest-string.md
create mode 100644 docs/reference/operators/visualization/_index.md
create mode 100644 docs/reference/operators/visualization/advanced/_index.md
create mode 100644
docs/reference/operators/visualization/advanced/choropleth-map.md
create mode 100644
docs/reference/operators/visualization/advanced/scatter3d-chart.md
create mode 100644 docs/reference/operators/visualization/basic/_index.md
create mode 100644 docs/reference/operators/visualization/basic/bar-chart.md
create mode 100644 docs/reference/operators/visualization/basic/bubble-chart.md
create mode 100644 docs/reference/operators/visualization/basic/dot-plot.md
create mode 100644
docs/reference/operators/visualization/basic/dumbbell-plot.md
create mode 100644
docs/reference/operators/visualization/basic/figure-factory-table.md
create mode 100644
docs/reference/operators/visualization/basic/filled-area-plot.md
create mode 100644 docs/reference/operators/visualization/basic/gantt-chart.md
create mode 100644
docs/reference/operators/visualization/basic/hierarchy-chart.md
create mode 100644 docs/reference/operators/visualization/basic/icicle-chart.md
create mode 100644 docs/reference/operators/visualization/basic/line-chart.md
create mode 100644 docs/reference/operators/visualization/basic/pie-chart.md
create mode 100644 docs/reference/operators/visualization/basic/range-slider.md
create mode 100644
docs/reference/operators/visualization/basic/sankey-diagram.md
create mode 100644 docs/reference/operators/visualization/basic/scatter-plot.md
create mode 100644 docs/reference/operators/visualization/basic/tables-plot.md
create mode 100644
docs/reference/operators/visualization/basic/time-series-plot.md
create mode 100644 docs/reference/operators/visualization/financial/_index.md
create mode 100644
docs/reference/operators/visualization/financial/bullet-chart.md
create mode 100644
docs/reference/operators/visualization/financial/candlestick-chart.md
create mode 100644
docs/reference/operators/visualization/financial/funnel-plot.md
create mode 100644
docs/reference/operators/visualization/financial/gauge-chart.md
create mode 100644
docs/reference/operators/visualization/financial/waterfall-chart.md
create mode 100644 docs/reference/operators/visualization/media/_index.md
create mode 100644
docs/reference/operators/visualization/media/html-visualizer.md
create mode 100644
docs/reference/operators/visualization/media/image-visualizer.md
create mode 100644
docs/reference/operators/visualization/media/url-visualizer.md
create mode 100644 docs/reference/operators/visualization/media/word-cloud.md
create mode 100644 docs/reference/operators/visualization/nested-table.md
create mode 100644 docs/reference/operators/visualization/scientific/_index.md
create mode 100644
docs/reference/operators/visualization/scientific/carpet-plot.md
create mode 100644
docs/reference/operators/visualization/scientific/contour-plot.md
create mode 100644
docs/reference/operators/visualization/scientific/dendrogram.md
create mode 100644 docs/reference/operators/visualization/scientific/heatmap.md
create mode 100644
docs/reference/operators/visualization/scientific/network-graph.md
create mode 100644
docs/reference/operators/visualization/scientific/parallel-coordinates-plot.md
create mode 100644
docs/reference/operators/visualization/scientific/polar-chart.md
create mode 100644
docs/reference/operators/visualization/scientific/quiver-plot.md
create mode 100644
docs/reference/operators/visualization/scientific/radar-chart.md
create mode 100644
docs/reference/operators/visualization/scientific/radar-plot.md
create mode 100644
docs/reference/operators/visualization/scientific/ternary-contour.md
create mode 100644
docs/reference/operators/visualization/scientific/ternary-plot.md
create mode 100644
docs/reference/operators/visualization/scientific/volcano-plot.md
create mode 100644
docs/reference/operators/visualization/scientific/wind-rose-chart.md
create mode 100644 docs/reference/operators/visualization/statistical/_index.md
create mode 100644
docs/reference/operators/visualization/statistical/boxviolin-plot.md
create mode 100644
docs/reference/operators/visualization/statistical/continuous-error-bands.md
create mode 100644
docs/reference/operators/visualization/statistical/empirical-cumulative-distribution-plot.md
create mode 100644
docs/reference/operators/visualization/statistical/histogram.md
create mode 100644
docs/reference/operators/visualization/statistical/histogram2d.md
create mode 100644
docs/reference/operators/visualization/statistical/scatter-matrix-chart.md
create mode 100644
docs/reference/operators/visualization/statistical/strip-chart.md
create mode 100644
docs/reference/operators/visualization/statistical/tree-plot.md
create mode 100644 docs/reference/project-structure.md
create mode 100644 docs/reference/storage.md
copy SECURITY.md => docs/security/_index.md (66%)
create mode 100644 docs/tutorials/_index.md
create mode 100644 docs/tutorials/create-dataset-upload-data.md
create mode 100644 docs/tutorials/guide-for-how-to-use-texera.md
create mode 100644 docs/tutorials/guide-to-enable-llm-agent.md
create mode 100644 docs/tutorials/guide-to-launch-lakekeeper.md
create mode 100644 docs/tutorials/guide-to-use-python-udf.md
create mode 100644 docs/tutorials/migrate-jupyter-notebook.md
create mode 100644
frontend/src/app/workspace/component/code-editor-dialog/annotation-suggestion.component.spec.ts
create mode 100644 frontend/vitest.browser.config.ts
create mode 100644 licenses-3rd-party-code/angular.md
copy licenses/LICENSE-MIT.txt =>
licenses-3rd-party-code/mbknor-jackson-jsonschema.txt (95%)
create mode 100644 licenses-3rd-party-code/monaco-languageclient.txt
create mode 100644 project/JdkOptions.scala