optimum-neuron-cache
/
neuronxcc-2.17.194.0+d312836f
/MODULE_003eca68b53533d6f2a7+bfc62e4c
/compile_flags.json
"--enable-saturate-infinity --enable-mixed-precision-accumulation --model-type transformer -O1 --tensorizer-options='--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2' --internal-enable-dge-levels vector_dynamic_offsets --logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt --enable-internal-neff-wrapper" |