|
{ |
|
"version": "QNN_SYSTEM_CONTEXT_BINARY_INFO_VERSION_3", |
|
"info": { |
|
"backendId": 6, |
|
"buildId": "v2.28.0.241029232508_102474", |
|
"coreApiVersion": "2.21.0", |
|
"backendApiVersion": "5.28.0", |
|
"socVersion": "", |
|
"contextBlobVersion": "3.2.0", |
|
"contextBlobSize": 566494808, |
|
"numContextTensors": 0, |
|
"contextTensors": [], |
|
"numGraphs": 2, |
|
"graphs": [ |
|
{ |
|
"version": "QNN_SYSTEM_CONTEXT_GRAPH_INFO_VERSION_3", |
|
"info": { |
|
"graphName": "ar128_cl4096_4_of_4", |
|
"numGraphInputs": 20, |
|
"graphInputs": [ |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 1, |
|
"name": "past_key_24_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
3968 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.16835589706897736, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 6, |
|
"name": "past_key_29_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
3968 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.17043833434581757, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 9, |
|
"name": "past_value_29_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
3968, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09825660288333893, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 16, |
|
"name": "past_value_24_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
3968, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.07847104221582413, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 125, |
|
"name": "past_key_30_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
3968 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.2074936181306839, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 128, |
|
"name": "past_value_30_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
3968, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.10411321371793747, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 267, |
|
"name": "past_key_31_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
3968 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.18935787677764893, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 270, |
|
"name": "past_value_31_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
3968, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.19053252041339875, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 441, |
|
"name": "past_key_25_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
3968 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.1846073865890503, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 444, |
|
"name": "past_value_25_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
3968, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09766243398189545, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 583, |
|
"name": "past_key_26_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
3968 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.15839417278766633, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 586, |
|
"name": "past_value_26_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
3968, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09959074854850769, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 731, |
|
"name": "past_key_27_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
3968 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.15847137570381165, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 734, |
|
"name": "past_value_27_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
3968, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.08399864286184311, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 875, |
|
"name": "past_key_28_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
3968 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.1828504055738449, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 878, |
|
"name": "past_value_28_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
3968, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09687352180480957, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 1041, |
|
"name": "_model_layers_23_Add_1_Add_output_0", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_16", |
|
"rank": 3, |
|
"dimensions": [ |
|
1, |
|
128, |
|
3072 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.191017746925354, |
|
"offset": -41581 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 1946, |
|
"name": "position_ids_cos", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_16", |
|
"rank": 4, |
|
"dimensions": [ |
|
1, |
|
1, |
|
128, |
|
48 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.00003632373773143627, |
|
"offset": -32768 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 1948, |
|
"name": "position_ids_sin", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_16", |
|
"rank": 4, |
|
"dimensions": [ |
|
1, |
|
1, |
|
128, |
|
48 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.00003632373773143627, |
|
"offset": -32768 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 2653, |
|
"name": "attention_mask", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_16", |
|
"rank": 4, |
|
"dimensions": [ |
|
1, |
|
1, |
|
128, |
|
4096 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.0007629510946571827, |
|
"offset": -65535 |
|
} |
|
} |
|
} |
|
} |
|
], |
|
"numGraphOutputs": 17, |
|
"graphOutputs": [ |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 1913, |
|
"name": "past_value_24_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
128, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.07847104221582413, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 2556, |
|
"name": "past_key_24_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
128 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.16835589706897736, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 3676, |
|
"name": "past_value_25_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
128, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09766243398189545, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 4317, |
|
"name": "past_key_25_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
128 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.1846073865890503, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 5436, |
|
"name": "past_value_26_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
128, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09959074854850769, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 6077, |
|
"name": "past_key_26_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
128 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.15839417278766633, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 7196, |
|
"name": "past_value_27_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
128, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.08399864286184311, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 7837, |
|
"name": "past_key_27_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
128 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.15847137570381165, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 8956, |
|
"name": "past_value_28_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
128, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09687352180480957, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 9597, |
|
"name": "past_key_28_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
128 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.1828504055738449, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 10716, |
|
"name": "past_value_29_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
128, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09825660288333893, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 11357, |
|
"name": "past_key_29_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
128 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.17043833434581757, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 12476, |
|
"name": "past_value_30_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
128, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.10411321371793747, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 13117, |
|
"name": "past_key_30_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
128 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.2074936181306839, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 14236, |
|
"name": "past_value_31_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
128, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.19053252041339875, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 14877, |
|
"name": "past_key_31_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
128 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.18935787677764893, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15140, |
|
"name": "logits", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_16", |
|
"rank": 3, |
|
"dimensions": [ |
|
1, |
|
128, |
|
32064 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.001873409142717719, |
|
"offset": -26111 |
|
} |
|
} |
|
} |
|
} |
|
], |
|
"numUpdateableTensors": 0, |
|
"updateableTensors": [], |
|
"graphBlobInfoSize": 40, |
|
"graphBlobInfo": [ |
|
{ |
|
"version": "QNN_SYSTEM_CONTEXT_HTP_GRAPH_INFO_BLOB_VERSION_V1", |
|
"info": { |
|
"spillFillBufferSize": 0, |
|
"optimizationLevel": 3, |
|
"vtcmSize": 8, |
|
"htpDlbc": 0, |
|
"numHvxThreads": 0 |
|
} |
|
} |
|
] |
|
} |
|
}, |
|
{ |
|
"version": "QNN_SYSTEM_CONTEXT_GRAPH_INFO_VERSION_3", |
|
"info": { |
|
"graphName": "ar1_cl4096_4_of_4", |
|
"numGraphInputs": 20, |
|
"graphInputs": [ |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15141, |
|
"name": "past_key_24_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
4095 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.16835589706897736, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15146, |
|
"name": "past_key_29_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
4095 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.17043833434581757, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15149, |
|
"name": "past_value_29_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
4095, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09825660288333893, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15156, |
|
"name": "past_value_24_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
4095, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.07847104221582413, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15265, |
|
"name": "past_key_30_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
4095 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.2074936181306839, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15268, |
|
"name": "past_value_30_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
4095, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.10411321371793747, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15407, |
|
"name": "past_key_31_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
4095 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.18935787677764893, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15410, |
|
"name": "past_value_31_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
4095, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.19053252041339875, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15581, |
|
"name": "past_key_25_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
4095 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.1846073865890503, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15584, |
|
"name": "past_value_25_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
4095, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09766243398189545, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15723, |
|
"name": "past_key_26_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
4095 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.15839417278766633, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15726, |
|
"name": "past_value_26_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
4095, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09959074854850769, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15871, |
|
"name": "past_key_27_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
4095 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.15847137570381165, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 15874, |
|
"name": "past_value_27_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
4095, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.08399864286184311, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 16015, |
|
"name": "past_key_28_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
4095 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.1828504055738449, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 16018, |
|
"name": "past_value_28_in", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
4095, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09687352180480957, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 16181, |
|
"name": "_model_layers_23_Add_1_Add_output_0", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_16", |
|
"rank": 3, |
|
"dimensions": [ |
|
1, |
|
1, |
|
3072 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.191017746925354, |
|
"offset": -41581 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 17086, |
|
"name": "position_ids_cos", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_16", |
|
"rank": 4, |
|
"dimensions": [ |
|
1, |
|
1, |
|
1, |
|
48 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.00003632373773143627, |
|
"offset": -32768 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 17088, |
|
"name": "position_ids_sin", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_16", |
|
"rank": 4, |
|
"dimensions": [ |
|
1, |
|
1, |
|
1, |
|
48 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.00003632373773143627, |
|
"offset": -32768 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 17793, |
|
"name": "attention_mask", |
|
"type": "QNN_TENSOR_TYPE_APP_WRITE", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_16", |
|
"rank": 4, |
|
"dimensions": [ |
|
1, |
|
1, |
|
1, |
|
4096 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.0007629510946571827, |
|
"offset": -65535 |
|
} |
|
} |
|
} |
|
} |
|
], |
|
"numGraphOutputs": 17, |
|
"graphOutputs": [ |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 17053, |
|
"name": "past_value_24_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
1, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.07847104221582413, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 17696, |
|
"name": "past_key_24_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
1 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.16835589706897736, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 18816, |
|
"name": "past_value_25_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
1, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09766243398189545, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 19457, |
|
"name": "past_key_25_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
1 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.1846073865890503, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 20576, |
|
"name": "past_value_26_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
1, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09959074854850769, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 21217, |
|
"name": "past_key_26_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
1 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.15839417278766633, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 22336, |
|
"name": "past_value_27_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
1, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.08399864286184311, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 22977, |
|
"name": "past_key_27_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
1 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.15847137570381165, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 24096, |
|
"name": "past_value_28_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
1, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09687352180480957, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 24737, |
|
"name": "past_key_28_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
1 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.1828504055738449, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 25856, |
|
"name": "past_value_29_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
1, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.09825660288333893, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 26497, |
|
"name": "past_key_29_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
1 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.17043833434581757, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 27616, |
|
"name": "past_value_30_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
1, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.10411321371793747, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 28257, |
|
"name": "past_key_30_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
1 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.2074936181306839, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 29376, |
|
"name": "past_value_31_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
1, |
|
96 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.19053252041339875, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 30017, |
|
"name": "past_key_31_out", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_8", |
|
"rank": 4, |
|
"dimensions": [ |
|
32, |
|
1, |
|
96, |
|
1 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.18935787677764893, |
|
"offset": -128 |
|
} |
|
} |
|
} |
|
}, |
|
{ |
|
"version": "QNN_TENSOR_VERSION_1", |
|
"info": { |
|
"id": 30280, |
|
"name": "logits", |
|
"type": "QNN_TENSOR_TYPE_APP_READ", |
|
"dataFormat": "QNN_TENSOR_DATA_FORMAT_FLAT_BUFFER", |
|
"dataType": "QNN_DATATYPE_UFIXED_POINT_16", |
|
"rank": 3, |
|
"dimensions": [ |
|
1, |
|
1, |
|
32064 |
|
], |
|
"memType": "QNN_TENSORMEMTYPE_MEMHANDLE", |
|
"quantizeParams": { |
|
"definition": "QNN_DEFINITION_DEFINED", |
|
"quantizationEncoding": "QNN_QUANTIZATION_ENCODING_SCALE_OFFSET", |
|
"scaleOffset": { |
|
"scale": 0.001873409142717719, |
|
"offset": -26111 |
|
} |
|
} |
|
} |
|
} |
|
], |
|
"numUpdateableTensors": 0, |
|
"updateableTensors": [], |
|
"graphBlobInfoSize": 40, |
|
"graphBlobInfo": [ |
|
{ |
|
"version": "QNN_SYSTEM_CONTEXT_HTP_GRAPH_INFO_BLOB_VERSION_V1", |
|
"info": { |
|
"spillFillBufferSize": 0, |
|
"optimizationLevel": 3, |
|
"vtcmSize": 8, |
|
"htpDlbc": 0, |
|
"numHvxThreads": 0 |
|
} |
|
} |
|
] |
|
} |
|
} |
|
], |
|
"contextMetadataSize": 8, |
|
"contextMetadata": { |
|
"version": "QNN_SYSTEM_CONTEXT_HTP_CONTEXT_INFO_BLOB_VERSION_V1", |
|
"info": { |
|
"dsp arch": 73 |
|
} |
|
}, |
|
"soc model": 43 |
|
} |
|
} |
|
|