|
|
@ -84,10 +84,6 @@ bool EmbeddingLLMWorker::loadModel()
|
|
|
|
return false;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// FIXME(jared): the user may want this to take effect without having to restart
|
|
|
|
|
|
|
|
int n_threads = MySettings::globalInstance()->threadCount();
|
|
|
|
|
|
|
|
m_model->setThreadCount(n_threads);
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// NOTE: explicitly loads model on CPU to avoid GPU OOM
|
|
|
|
// NOTE: explicitly loads model on CPU to avoid GPU OOM
|
|
|
|
// TODO(cebtenzzre): support GPU-accelerated embeddings
|
|
|
|
// TODO(cebtenzzre): support GPU-accelerated embeddings
|
|
|
|
bool success = m_model->loadModel(filePath.toStdString(), 2048, 0);
|
|
|
|
bool success = m_model->loadModel(filePath.toStdString(), 2048, 0);
|
|
|
@ -104,6 +100,11 @@ bool EmbeddingLLMWorker::loadModel()
|
|
|
|
m_model = nullptr;
|
|
|
|
m_model = nullptr;
|
|
|
|
return false;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// FIXME(jared): the user may want this to take effect without having to restart
|
|
|
|
|
|
|
|
int n_threads = MySettings::globalInstance()->threadCount();
|
|
|
|
|
|
|
|
m_model->setThreadCount(n_threads);
|
|
|
|
|
|
|
|
|
|
|
|
return true;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|