- cache_dir (olive.engine.EngineConfig attribute)
-
calibrate_method
-
calibration_sampling_size
-
checkpoint_path
- clean_cache (olive.engine.EngineConfig attribute)
- clean_evaluation_cache (olive.engine.EngineConfig attribute)
-
command line option
- activation_type, [1], [2]
- ActivationSymmetric, [1], [2], [3]
- AddQDQPairToWeight
- algorithms
- all_tensors_to_one_file, [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17]
- approach, [1], [2]
- azureml_client, [1], [2]
- backend, [1], [2]
- batch_size, [1], [2], [3], [4], [5], [6]
- blocksize
- calibrate_method, [1], [2]
- calibration_sampling_size, [1]
- checkpoint_path
- compute_device
- compute_dtype
- cpu_cores
- data_config, [1], [2], [3], [4], [5], [6], [7], [8]
- data_dir, [1], [2], [3], [4], [5], [6], [7]
- dataloader_func, [1], [2], [3], [4], [5], [6], [7]
- datastore_name
- datastore_url
- device, [1], [2], [3]
- disable_shape_infer
- do_validate
- domain, [1], [2]
- double_quant
- enable_cuda_graph
- enable_dpu
- enable_htp
- EnableSubgraph, [1], [2]
- engine_config
- eval_data_config
- eval_dataset_size
- excluded_precisions, [1], [2]
- execution_mode_list
- external_data_name, [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17]
- extra.Sigmoid.nnapi, [1], [2]
- extra_args, [1]
- extra_config
- extra_options, [1], [2], [3]
- extra_session_config
- float16, [1]
- force_fp32_ops
- ForceQuantizeNoInputCheck, [1], [2]
- gpus
- group
- hidden_size
- htp_socs
- input
- input_int32
- input_layouts
- input_names, [1]
- input_nodes
- input_shape
- input_shapes, [1]
- input_types, [1]
- inter_thread_num_list
- intra_thread_num_list
- io_bind
- job_name
- keep_io_types, [1]
- layer_name_filter, [1]
- logger
- lora_alpha
- lora_dropout
- lora_r
- MatMulConstBOnly, [1], [2]
- max_finite_val
- max_layer, [1]
- metric, [1], [2]
- metric_func
- min_layer, [1]
- min_positive_val
- model_type
- modules_to_fuse
- multivariate
- name, [1]
- need_layer_fusing
- no_repeat_ngram_size
- node_block_list
- nodes_to_exclude, [1], [2], [3]
- nodes_to_quantize, [1], [2], [3]
- num_epochs
- num_heads
- num_samples, [1]
- num_steps
- only_onnxruntime
- op_block_list, [1]
- op_types_to_quantize, [1], [2], [3]
- opt_level
- opt_level_list
- optimization_options
- optimize_model
- output_name
- output_names
- output_nodes
- path, [1]
- per_channel, [1], [2], [3]
- percdamp
- post
- pre
- providers_list
- ptl_data_module
- ptl_module
- qconfig_func
- quant_format, [1], [2], [3], [4]
- quant_level, [1], [2]
- quant_mode, [1], [2], [3]
- quant_preprocess, [1], [2], [3]
- quant_type
- recipes, [1], [2]
- reduce_range, [1], [2], [3], [4], [5]
- relative_path, [1]
- save_as_external_data, [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17]
- script_dir, [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11]
- seed, [1], [2]
- sparsity
- target_device
- target_opset, [1], [2], [3], [4]
- tool_command
- tool_command_args
- train_batch_size
- train_data_config
- train_data_dir
- train_dataloader_func
- training_args
- training_loop_func
- trt_fp16_enable
- tuning_criterion, [1], [2]
- use_dynamo_exporter, [1]
- use_enhanced_quantizer
- use_external_data_format
- use_forced_decoder_ids
- use_gpu
- user_script, [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11]
- val_data_dir
- version
- weight_only_config, [1], [2]
- weight_type, [1], [2], [3]
- WeightSymmetric, [1], [2], [3]
- with_replacement
|
|