Split
Split Certified

Split a file from Kestra internal storage.

yaml
type: io.kestra.plugin.core.storage.Split
yaml
    # Example flow: download a CSV file, then split it using the `bytes` property.
    id: split_bytes
    namespace: company.team

    tasks:
      # Fetch the sample orders CSV over HTTP.
      - id: download
        type: io.kestra.plugin.core.http.Download
        uri: https://huggingface.co/datasets/kestra/datasets/raw/main/csv/orders.csv

      # Split the file produced by the `download` task; the split criterion
      # here is `bytes: 5KB`.
      - id: split
        type: io.kestra.plugin.core.storage.Split
        from: '{{ outputs.download.uri }}'
        bytes: 5KB

yaml
    # Example flow: download a CSV file, then split it using the `rows` property.
    id: split_rows
    namespace: company.team

    tasks:
      # Fetch the sample orders CSV over HTTP.
      - id: download
        type: io.kestra.plugin.core.http.Download
        uri: https://huggingface.co/datasets/kestra/datasets/raw/main/csv/orders.csv

      # Split the file produced by the `download` task; the split criterion
      # here is `rows: 10`.
      - id: split
        type: io.kestra.plugin.core.storage.Split
        from: '{{ outputs.download.uri }}'
        rows: 10

yaml
    # Example flow: download a CSV file, then split it using the `partitions`
    # property.
    id: split_partitions
    namespace: company.team

    tasks:
      # Fetch the sample orders CSV over HTTP.
      - id: download
        type: io.kestra.plugin.core.http.Download
        uri: https://huggingface.co/datasets/kestra/datasets/raw/main/csv/orders.csv

      # Split the file produced by the `download` task; the split criterion
      # here is `partitions: 4`.
      - id: split
        type: io.kestra.plugin.core.storage.Split
        from: '{{ outputs.download.uri }}'
        partitions: 4

yaml
    # Example flow: generate a small log file with a shell command, then split
    # it using the `regexPattern` property.
    id: storage_tasks
    namespace: company.team

    tasks:
      # Write a three-line log file and expose it as an output file of the task.
      - id: generate_logs
        type: io.kestra.plugin.scripts.shell.Commands
        commands:
          # Literal block scalar: keeps the newlines embedded in the quoted
          # shell string while staying correctly indented inside the list item.
          - |-
            echo "INFO - wow
            ERROR - no
            INFO - ok" > logs.txt
        outputFiles:
          - logs.txt

      - id: split
        type: io.kestra.plugin.core.storage.Split
        # The expression must name the task that produced the file
        # (`generate_logs`); there is no task called `echo` in this flow.
        from: "{{ outputs.generate_logs.outputFiles['logs.txt'] }}"
        # Single-quoted so the backslash stays literal: `\w` is not a valid
        # escape sequence inside a double-quoted YAML scalar.
        # NOTE(review): presumably lines are grouped by the first capture
        # group (the log level here) - confirm against the plugin docs.
        regexPattern: '^(\w+)'
Properties
Default: `\n`
SubType: string