Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 8 of 8 for weight_only (0.15 sec)

  1. tensorflow/compiler/mlir/quantization/tensorflow/tests/preprocess_op_weight_only.mlir

    // RUN: tf-quant-opt %s -split-input-file -quant-preprocess-op='target-opset=XLA quantization-method=weight_only enable-per-channel-quantization=false' | FileCheck --check-prefix PerTensor %s
    // RUN: tf-quant-opt %s -split-input-file -quant-preprocess-op='target-opset=XLA quantization-method=weight_only enable-per-channel-quantization=true' | FileCheck --check-prefix PerChannel %s
    
    module {
      // For XLA weight-only per-channel depthwise convolution, tensor shape should have
    Registered: Sun Jun 16 05:45:23 UTC 2024
    - Last Modified: Mon Oct 30 06:52:55 UTC 2023
    - 4.7K bytes
    - Viewed (0)
  2. tensorflow/compiler/mlir/quantization/tensorflow/tests/insert_quantized_functions_weight_only.mlir

    // RUN: tf-quant-opt %s -quant-insert-quantized-functions='quantization-method=weight_only target-opset=XLA' | FileCheck %s
    
    // Empty module
    module {
      func.func @simple_fn(%arg0: tensor<*xf32>) -> tensor<*xf32> {
        func.return %arg0 : tensor<*xf32>
      }
    }
    
    // CHECK-NOT: func private @internal_dequantize_f32
    // CHECK-NOT: func private @internal_conv3d_fn
    // CHECK-NOT: func private @internal_batch_matmul_fn
    Registered: Sun Jun 16 05:45:23 UTC 2024
    - Last Modified: Thu Feb 16 03:34:36 UTC 2023
    - 843 bytes
    - Viewed (0)
  3. tensorflow/compiler/mlir/quantization/tensorflow/passes/lift_quantizable_spots_as_functions_drq.cc

              clEnumValN(tensorflow::quantization::QuantizationMethod::
                             METHOD_STATIC_RANGE_WEIGHT_ONLY_INT8,
                         "weight_only", "Post-training weight_only quantizaiton"))};
    };
    
    class CheckQuantizableOps
        : public mlir::OpRewritePattern<TF::PartitionedCallOp> {
     public:
      explicit CheckQuantizableOps(MLIRContext* context,
    Registered: Sun Jun 16 05:45:23 UTC 2024
    - Last Modified: Thu Apr 25 16:01:03 UTC 2024
    - 8.5K bytes
    - Viewed (0)
  4. tensorflow/compiler/mlir/quantization/tensorflow/passes/insert_quantized_functions.cc

              clEnumValN(tensorflow::quantization::QuantizationMethod::
                             METHOD_STATIC_RANGE_WEIGHT_ONLY_INT8,
                         "weight_only", "Post-training weight_only quantizaiton"))};
    
      Option<OpSet> op_set_{
          *this, "target-opset", llvm::cl::init(OpSet::TF),
          llvm::cl::desc("Choose target opset."),
          llvm::cl::values(
    Registered: Sun Jun 16 05:45:23 UTC 2024
    - Last Modified: Fri Mar 22 05:52:39 UTC 2024
    - 8.7K bytes
    - Viewed (0)
  5. tensorflow/compiler/mlir/quantization/stablehlo/utils/fill_quantization_options.cc

          break;
        // Note: This is weight-only quantization by default, but with the legacy
        // flag "--force_dynamic_range_in_kernel", a DRQ behavior will be forced
        // in the kernel.
        case PresetQuantizationMethod::WEIGHT_ONLY:
          weight_component = custom_method.add_quantization_component_spec();
          SetQuantizationComponentSpec(weight_component,
                                       QuantizationComponentSpec::COMPONENT_WEIGHT,
    Registered: Sun Jun 16 05:45:23 UTC 2024
    - Last Modified: Tue Mar 05 08:32:43 UTC 2024
    - 6.2K bytes
    - Viewed (0)
  6. tensorflow/compiler/mlir/quantization/stablehlo/quantization_options.proto

        // Apply default weight-only quantization. Weights are quantized during
        // conversion, then dequantized during inference.
        // Activation: f32, Weight: qi8, Bias: f32
        WEIGHT_ONLY = 1;
    
        // Apply default dynamic range quantization. Quantized tensor value's
        // ranges are determined during graph runtime.
        // Activation: f32, Weight: qi8, Bias: f32
    Registered: Sun Jun 16 05:45:23 UTC 2024
    - Last Modified: Thu Jun 22 02:20:05 UTC 2023
    - 3.6K bytes
    - Viewed (0)
  7. tensorflow/compiler/mlir/quantization/tensorflow/quantization_options.proto

      // is:
      // 1) STATIC_RANGE
      //    - COMPONENT_ACTIVATION: INT_8
      //    - COMPONENT_WEIGHT: INT_8
      //    - COMPONENT_BIAS: INT_32
      // 2) WEIGHT_ONLY
      //    - COMPONENT_WEIGHT: INT_8
      // 3) DYNAMIC_RANGE
      //    - COMPONENT_ACTIVATION: INT_8
      //    - COMPONENT_WEIGHT: INT_8
      //    - COMPONENT_BIAS: INT_32
    Registered: Sun Jun 16 05:45:23 UTC 2024
    - Last Modified: Tue Mar 19 06:31:19 UTC 2024
    - 9.2K bytes
    - Viewed (0)
  8. tensorflow/compiler/mlir/quantization/common/quantization_lib/quantization_config.cc

              custom_op_map[node_name].quantizable_input_indices.push_back(
                  std::stoi(cur_index));
            }
            break;
          }
          case CustomOpUpdateOptions::kWeightOnly:
            custom_op_map[node_name].is_weight_only =
                GetBooleanSpecs(node_specification);
            break;
          case CustomOpUpdateOptions::kNoSideEffect:
            custom_op_map[node_name].no_side_effect =
    Registered: Sun Jun 16 05:45:23 UTC 2024
    - Last Modified: Tue Mar 05 07:39:40 UTC 2024
    - 5.9K bytes
    - Viewed (0)
Back to top