@@ -27,52 +27,37 @@ namespace {
2727std::string GetSuitableCudaVersion (const std::string& engine,
2828 const std::string& cuda_driver_version) {
2929 auto suitable_toolkit_version = " " ;
30- if (engine == kTrtLlmRepo || engine == kTrtLlmEngine ) {
31- // for tensorrt-llm, we need to download cuda toolkit v12.4
32- suitable_toolkit_version = " 12.4" ;
33- } else {
34- // llamacpp
35- auto cuda_driver_semver =
36- semantic_version_utils::SplitVersion (cuda_driver_version);
37- if (cuda_driver_semver.major == 11 ) {
38- suitable_toolkit_version = " 11.7" ;
39- } else if (cuda_driver_semver.major == 12 ) {
40- suitable_toolkit_version = " 12.0" ;
41- }
30+
31+ // llamacpp
32+ auto cuda_driver_semver =
33+ semantic_version_utils::SplitVersion (cuda_driver_version);
34+ if (cuda_driver_semver.major == 11 ) {
35+ suitable_toolkit_version = " 11.7" ;
36+ } else if (cuda_driver_semver.major == 12 ) {
37+ suitable_toolkit_version = " 12.0" ;
4238 }
39+
4340 return suitable_toolkit_version;
4441}
4542
4643// Need to change this after we rename repositories
4744std::string NormalizeEngine (const std::string& engine) {
4845 if (engine == kLlamaEngine ) {
4946 return kLlamaRepo ;
50- } else if (engine == kOnnxEngine ) {
51- return kOnnxRepo ;
52- } else if (engine == kTrtLlmEngine ) {
53- return kTrtLlmRepo ;
5447 }
5548 return engine;
5649};
5750
5851std::string Repo2Engine (const std::string& r) {
5952 if (r == kLlamaRepo ) {
6053 return kLlamaEngine ;
61- } else if (r == kOnnxRepo ) {
62- return kOnnxEngine ;
63- } else if (r == kTrtLlmRepo ) {
64- return kTrtLlmEngine ;
6554 }
6655 return r;
6756};
6857
6958std::string GetEnginePath (std::string_view e) {
7059 if (e == kLlamaRepo ) {
7160 return kLlamaLibPath ;
72- } else if (e == kOnnxRepo ) {
73- return kOnnxLibPath ;
74- } else if (e == kTrtLlmRepo ) {
75- return kTensorrtLlmPath ;
7661 }
7762 return kLlamaLibPath ;
7863};
@@ -85,13 +70,6 @@ cpp::result<void, std::string> EngineService::InstallEngineAsync(
8570 CTL_INF (" InstallEngineAsync: " << ne << " , " << version << " , "
8671 << variant_name.value_or (" " ));
8772 auto os = hw_inf_.sys_inf ->os ;
88- if (os == kMacOs && (ne == kOnnxRepo || ne == kTrtLlmRepo )) {
89- return cpp::fail (" Engine " + ne + " is not supported on macOS" );
90- }
91-
92- if (os == kLinuxOs && ne == kOnnxRepo ) {
93- return cpp::fail (" Engine " + ne + " is not supported on Linux" );
94- }
9573
9674 auto result = DownloadEngine (ne, version, variant_name);
9775 if (result.has_error ()) {
@@ -386,9 +364,8 @@ cpp::result<void, std::string> EngineService::DownloadEngine(
386364
387365cpp::result<bool , std::string> EngineService::DownloadCuda (
388366 const std::string& engine, bool async) {
389- if (hw_inf_.sys_inf ->os == " mac" || engine == kOnnxRepo ||
390- engine == kOnnxEngine ) {
391- // mac and onnx engine does not require cuda toolkit
367+ if (hw_inf_.sys_inf ->os == " mac" ) {
368+ // mac does not require cuda toolkit
392369 return true ;
393370 }
394371
@@ -453,13 +430,7 @@ cpp::result<bool, std::string> EngineService::DownloadCuda(
453430std::string EngineService::GetMatchedVariant (
454431 const std::string& engine, const std::vector<std::string>& variants) {
455432 std::string matched_variant;
456- if (engine == kTrtLlmRepo || engine == kTrtLlmEngine ) {
457- matched_variant = engine_matcher_utils::ValidateTensorrtLlm (
458- variants, hw_inf_.sys_inf ->os , hw_inf_.cuda_driver_version );
459- } else if (engine == kOnnxRepo || engine == kOnnxEngine ) {
460- matched_variant = engine_matcher_utils::ValidateOnnx (
461- variants, hw_inf_.sys_inf ->os , hw_inf_.sys_inf ->arch );
462- } else if (engine == kLlamaRepo || engine == kLlamaEngine ) {
433+ if (engine == kLlamaRepo || engine == kLlamaEngine ) {
463434 auto suitable_avx =
464435 engine_matcher_utils::GetSuitableAvxVariant (hw_inf_.cpu_inf );
465436 matched_variant = engine_matcher_utils::Validate (
@@ -638,13 +609,6 @@ cpp::result<std::vector<EngineVariantResponse>, std::string>
638609EngineService::GetInstalledEngineVariants (const std::string& engine) const {
639610 auto ne = NormalizeEngine (engine);
640611 auto os = hw_inf_.sys_inf ->os ;
641- if (os == kMacOs && (ne == kOnnxRepo || ne == kTrtLlmRepo )) {
642- return cpp::fail (" Engine " + engine + " is not supported on macOS" );
643- }
644-
645- if (os == kLinuxOs && ne == kOnnxRepo ) {
646- return cpp::fail (" Engine " + engine + " is not supported on Linux" );
647- }
648612
649613 auto engines_variants_dir =
650614 file_manager_utils::GetEnginesContainerPath () / ne;
@@ -954,13 +918,7 @@ cpp::result<bool, std::string> EngineService::IsEngineReady(
954918 }
955919
956920 auto os = hw_inf_.sys_inf ->os ;
957- if (os == kMacOs && (ne == kOnnxRepo || ne == kTrtLlmRepo )) {
958- return cpp::fail (" Engine " + engine + " is not supported on macOS" );
959- }
960921
961- if (os == kLinuxOs && ne == kOnnxRepo ) {
962- return cpp::fail (" Engine " + engine + " is not supported on Linux" );
963- }
964922 auto installed_variants = GetInstalledEngineVariants (engine);
965923 if (installed_variants.has_error ()) {
966924 return cpp::fail (installed_variants.error ());
0 commit comments