# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements.  See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License.  You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Pipeline options for the gemma_vllm_batch run, one flag per line.
# NOTE(review): these comment lines assume the consumer of this file skips
# lines starting with '#', as it presumably does for the license header --
# confirm before adding comments between individual flags.
#
# Execution: DataflowRunner in region us-central1 with worker_zone
#   us-central1-b, machine_type n1-standard-8, disk_size_gb 50,
#   num_workers 8, max_num_workers 25, THROUGHPUT_BASED autoscaling.
# Storage: temp_location and staging_location point at the same GCS path.
# Accelerator: dataflow_service_options carries a worker_accelerator spec of
#   type nvidia-tesla-t4, count 1, with install-nvidia-driver.
#   NOTE(review): that value contains ';' characters. If these lines are ever
#   expanded unquoted into a shell command line, ';' would act as a command
#   separator -- verify that the consumer quotes each argument.
# Inputs: --input names the sentences_50k.txt object; --model_gcs_path names
#   the gemma-2b-it model location; --input_options is an empty object ({}).
# Results: publish_to_big_query is true; output_table, metrics_dataset,
#   metrics_table and influx_measurement all use the gemma_vllm_batch name.
--runner=DataflowRunner
--region=us-central1
--temp_location=gs://temp-storage-for-perf-tests/loadtests
--staging_location=gs://temp-storage-for-perf-tests/loadtests
--input=gs://apache-beam-ml/testing/inputs/sentences_50k.txt
--machine_type=n1-standard-8
--worker_zone=us-central1-b
--disk_size_gb=50
--input_options={}
--num_workers=8
--max_num_workers=25
--autoscaling_algorithm=THROUGHPUT_BASED
--publish_to_big_query=true
--sdk_location=container
--output_table=apache-beam-testing.beam_run_inference.result_gemma_vllm_batch
--metrics_dataset=beam_run_inference
--metrics_table=gemma_vllm_batch
--influx_measurement=gemma_vllm_batch
--model_gcs_path=gs://apache-beam-ml/models/gemma-2b-it
--dataflow_service_options=worker_accelerator=type:nvidia-tesla-t4;count:1;install-nvidia-driver
--experiments=use_runner_v2