{"templateId":"markdown","sharedDataIds":{"sidebar":"sidebar-sidebars.yaml"},"props":{"metadata":{"markdoc":{"tagList":[]},"redocly_category":"Products","product_name":"Machine Learning","type":"markdown"},"seo":{"title":"Managing the Machine Learning Pipeline","description":"Treasure Data Product Documentation · Collect and Unify · Segment and Activate · Experiment and Analyze · Decisioning Automate with AI Scale and Trust.","siteUrl":"https://docs.treasuredata.com","lang":"en-US","llmstxt":{"hide":false,"sections":[{"title":"Table of contents","includeFiles":["**/*"],"excludeFiles":[]}],"excludeFiles":[]}},"dynamicMarkdocComponents":[],"compilationErrors":[],"ast":{"$$mdtype":"Tag","name":"article","attributes":{},"children":[{"$$mdtype":"Tag","name":"Heading","attributes":{"level":1,"id":"managing-the-machine-learning-pipeline","__idx":0},"children":["Managing the Machine Learning Pipeline"]},{"$$mdtype":"Tag","name":"p","attributes":{},"children":["After ingesting your data into Treasure Data, you can build a predictive model using Treasure Data queries and workflows."]},{"$$mdtype":"Tag","name":"p","attributes":{},"children":["The typical machine learning pipeline for supervised learning is:"]},{"$$mdtype":"Tag","name":"ol","attributes":{},"children":[{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":["data preparation"]}]},{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":["building a model"]}]},{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":["evaluating the model"]}]},{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":["predicting unseen data with the trained model"]}]}]},{"$$mdtype":"Tag","name":"p","attributes":{},"children":["You can use Treasure Workflows to manage your supervised learning process. 
Treasure Data (TD) provides AutoML as a feature which can be configured within the familiar ",{"$$mdtype":"Tag","name":"MarkdownLink","attributes":{"href":"/products/customer-data-platform/data-workbench/workflows"},"children":["Treasure Workflow"]}," environment. Learn more about ",{"$$mdtype":"Tag","name":"MarkdownLink","attributes":{"href":"/products/customer-data-platform/machine-learning/automl"},"children":["AutoML"]}]},{"$$mdtype":"Tag","name":"p","attributes":{},"children":[{"$$mdtype":"Tag","name":"img","attributes":{"src":"/assets/105578848.2775c3c343559d67e1778594d2fc1c2403686c7398feafe43ccbdbe8a0ad1bce.3cb60505.png","alt":""},"children":[]}]},{"$$mdtype":"Tag","name":"p","attributes":{},"children":["By using Digdag Treasure Data operators within your Treasure Workflow, you can automate your machine learning from data preparation to prediction. Digdag Treasure Data operators include:"]},{"$$mdtype":"Tag","name":"ul","attributes":{},"children":[{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":[{"$$mdtype":"Tag","name":"MarkdownLink","attributes":{"href":"https://docs.digdag.io/operators/td.html"},"children":["td>: Treasure Data queries"]}]}]},{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":[{"$$mdtype":"Tag","name":"MarkdownLink","attributes":{"href":"https://docs.digdag.io/operators/td_run.html"},"children":["td_run>: Treasure Data saved queries"]}]}]},{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":[{"$$mdtype":"Tag","name":"MarkdownLink","attributes":{"href":"https://docs.digdag.io/operators/td_ddl.html"},"children":["td_ddl>: Treasure Data 
operations"]}]}]},{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":[{"$$mdtype":"Tag","name":"MarkdownLink","attributes":{"href":"https://docs.digdag.io/operators/td_load.html"},"children":["td_load>: Treasure Data bulk loading"]}]}]},{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":[{"$$mdtype":"Tag","name":"MarkdownLink","attributes":{"href":"https://docs.digdag.io/operators/td_for_each.html"},"children":["td_for_each>: Repeat using Treasure Data queries"]}]}]},{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":[{"$$mdtype":"Tag","name":"MarkdownLink","attributes":{"href":"https://docs.digdag.io/operators/td_wait.html"},"children":["td_wait>: Waits for data arriving at Treasure Data table"]}]}]},{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":[{"$$mdtype":"Tag","name":"MarkdownLink","attributes":{"href":"https://docs.digdag.io/operators/td_wait_table.html"},"children":["td_wait_table>: Waits for data arriving at Treasure Data table"]}]}]},{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":[{"$$mdtype":"Tag","name":"MarkdownLink","attributes":{"href":"https://docs.digdag.io/operators/td_partial_delete.html"},"children":["td_partial_delete>: Delete range of Treasure Data table"]}]}]},{"$$mdtype":"Tag","name":"li","attributes":{},"children":[{"$$mdtype":"Tag","name":"p","attributes":{},"children":[{"$$mdtype":"Tag","name":"MarkdownLink","attributes":{"href":"https://docs.digdag.io/operators/td_table_export.html"},"children":["td_table_export>: Treasure Data table export to S3"]}]}]}]},{"$$mdtype":"Tag","name":"p","attributes":{},"children":["Digdag can run tasks in parallel, so you can simultaneously run independent tasks such as parameter tuning. 
Treasure Workflows enable you to make prediction tasks a periodic part of your product offerings. A stable way to run your machine learning processes in batches, on an hourly or daily basis, lets you evolve them over time and derive a better predictive model."]},{"$$mdtype":"Tag","name":"p","attributes":{},"children":[{"$$mdtype":"Tag","name":"img","attributes":{"src":"/assets/105578847.ce353f50a12e39ebe398e8039749d93187b5c9e549cbd0c65abfa050a1499f71.3cb60505.png","alt":""},"children":[]}]}]},"headings":[{"value":"Managing the Machine Learning Pipeline","id":"managing-the-machine-learning-pipeline","depth":1}],"frontmatter":{"seo":{"title":"Managing the Machine Learning Pipeline"}},"lastModified":"2026-06-01T11:27:28.000Z","pagePropGetterError":{"message":"","name":""}},"slug":"/products/customer-data-platform/machine-learning/automl/managing-the-machine-learning-pipeline","userData":{"isAuthenticated":false,"teams":["anonymous"]},"isPublic":true}