createSession method

@override
Future<InferenceModelSession> createSession({
  double temperature = 0.8,
  int randomSeed = 1,
  int topK = 1,
  double? topP,
  String? loraPath,
  bool? enableVisionModality,
})

Creates a new InferenceModelSession for generation.

temperature, randomSeed, topK, and topP are sampling parameters. loraPath is an optional path to a LoRA weights file. enableVisionModality enables vision modality for multimodal models.

Implementation

/// Creates a new [InferenceModelSession] for generation.
///
/// [temperature], [randomSeed], [topK], and [topP] control sampling.
/// [loraPath] optionally points to a LoRA weights file; when omitted, the
/// installed LoRA file from the model manager is used if present.
/// [enableVisionModality] is accepted for interface compatibility but is not
/// yet implemented on the web platform (a debug warning is printed).
///
/// Concurrent callers share a single in-flight initialization. On failure the
/// returned future completes with an [Exception] and the cached initialization
/// is cleared so a later call can retry.
@override
Future<InferenceModelSession> createSession({
  double temperature = 0.8,
  int randomSeed = 1,
  int topK = 1,
  double? topP,
  String? loraPath,
  bool? enableVisionModality,
}) async {
  // TODO: Implement vision modality for web.
  if (enableVisionModality == true) {
    if (kDebugMode) {
      print('Warning: Vision modality is not yet implemented for web platform');
    }
  }

  // If a session is already being (or has been) created, share that future
  // instead of racing to create a second engine instance.
  if (_initCompleter case Completer<InferenceModelSession> completer) {
    return completer.future;
  }
  final completer = _initCompleter = Completer<InferenceModelSession>();
  try {
    // Use Modern API to get model path (same as mobile).
    final activeModel = modelManager.activeInferenceModel;
    if (activeModel == null) {
      throw Exception('No active inference model set');
    }

    final modelFilePaths = await modelManager.getModelFilePaths(activeModel);
    if (modelFilePaths == null || modelFilePaths.isEmpty) {
      throw Exception('Model file paths not found');
    }

    // Get model path from Modern API.
    final modelPath = modelFilePaths[PreferencesKeys.installedModelFileName];
    if (modelPath == null) {
      throw Exception('Model path not found in file paths');
    }

    // Load the MediaPipe GenAI WASM runtime from the CDN.
    final fileset = await FilesetResolver.forGenAiTasks('https://cdn.jsdelivr.net/npm/@mediapipe/tasks-genai@latest/wasm'.toJS).toDart;

    // Prefer an explicitly supplied LoRA path; fall back to the installed one.
    // LoRA is only passed through when the rank list is also configured.
    final loraPathToUse = loraPath ?? modelFilePaths[PreferencesKeys.installedLoraFileName];
    final hasLoraParams = loraPathToUse != null && loraRanks != null;

    final config = LlmInferenceOptions(
      baseOptions: LlmInferenceBaseOptions(modelAssetPath: modelPath),
      maxTokens: maxTokens,
      randomSeed: randomSeed,
      topK: topK,
      temperature: temperature,
      topP: topP,
      supportedLoraRanks: !hasLoraParams ? null : Int32List.fromList(loraRanks!).toJS,
      loraPath: !hasLoraParams ? null : loraPathToUse,
      maxNumImages: supportImage ? (maxNumImages ?? 1) : null,
    );

    final llmInference = await LlmInference.createFromOptions(fileset, config).toDart;

    final session = this.session = WebModelSession(
      modelType: modelType,
      fileType: fileType,
      llmInference: llmInference,
      supportImage: supportImage, // Enabling image support
      onClose: onClose,
    );
    completer.complete(session);
    return session;
  } catch (e, st) {
    // BUG FIX: the completer was previously left pending on failure, so any
    // caller holding the cached future would hang forever and initialization
    // could never be retried. Clear the cache, then fail the shared future so
    // every waiter (including this call) observes the same error with its
    // original stack trace attached.
    _initCompleter = null;
    completer.completeError(Exception('Failed to create session: $e'), st);
    return completer.future;
  }
}