-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathexample_segment_identity_dataflow.sh
More file actions
executable file
·33 lines (32 loc) · 1.36 KB
/
example_segment_identity_dataflow.sh
File metadata and controls
executable file
·33 lines (32 loc) · 1.36 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
#!/bin/bash
## Usage:
## ./example_segment_identity_dataflow.sh scratch_output
#
# Example launcher: runs the `segment_identity` command of the `dev`
# docker compose service with `--runner=dataflow` for the single date
# 2025-01-01.
#
# Arguments:
#   $1 - dataset name; it is interpolated into the source and destination
#        table names as world-fishing-827.<dataset>.<table>.
# Outputs:
#   Prints the chosen dataset, then whatever `docker compose run` prints.
# Returns:
#   1 (after printing the usage lines above) when no dataset is given;
#   otherwise the exit status of `docker compose run`.
#
# NOTE: the usage printer below emits every line of this file that starts
# with two hash characters, so ordinary comments must use a single hash.

set -euo pipefail

# "${1:-}" keeps the emptiness test valid under `set -u` and for values that
# contain whitespace (the unquoted form made `[` fail on such input).
if [[ -z "${1:-}" ]]; then
  # `|| true`: the missing-argument path always exits 1, even if grep fails.
  grep '^##' -- "$0" || true
  exit 1
fi

readonly DATASET_OUT="$1"
echo "Output dataset ${DATASET_OUT}."

# Arguments are collected in an array so each one stays a single word
# regardless of what the dataset name contains.
pipeline_args=(
  # Pipeline inputs and output.
  --date_range='2025-01-01,2025-01-01'
  --source_segments="world-fishing-827.${DATASET_OUT}.internal__segments"
  --source_fragments="world-fishing-827.${DATASET_OUT}.internal__fragments"
  --dest_segment_identity="world-fishing-827.${DATASET_OUT}.internal__segment_identity_daily"

  # Worker packaging.
  --setup_file=./setup.py
  --sdk_container_image=gcr.io/world-fishing-827/github.com/globalfishingwatch/pipe-segment/worker:v4.4.1

  # Labels attached to the run.
  --labels=environment=develop
  --labels=resource_creator=local_example
  --labels=project=core_pipeline
  --labels=version=v3
  --labels=step=segment
  --labels=stage=productive

  # Runner, project, locations and sizing.
  --runner=dataflow
  --wait_for_job
  --project=world-fishing-827
  --temp_location=gs://pipe-temp-us-central-ttl7/dataflow_temp
  --staging_location=gs://pipe-temp-us-central-ttl7/dataflow_staging
  --region=us-central1
  --max_num_workers=600
  --worker_machine_type=e2-standard-4
  --disk_size_gb=50
  --job_name=test-segment-segment-identity--20250101
  --experiments=use_runner_v2

  # Networking.
  --no_use_public_ips
  --network=gfw-internal-network
  --subnetwork=regions/us-central1/subnetworks/gfw-internal-us-central1
)

docker compose run --rm dev segment_identity "${pipeline_args[@]}"