llama-stack 0.4.2__py3-none-any.whl → 0.4.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (182) hide show
  1. llama_stack/core/library_client.py +80 -3
  2. llama_stack/core/routing_tables/common.py +11 -0
  3. llama_stack/core/routing_tables/vector_stores.py +4 -0
  4. llama_stack/core/stack.py +16 -1
  5. llama_stack/core/storage/kvstore/kvstore.py +11 -0
  6. llama_stack/core/storage/kvstore/mongodb/mongodb.py +5 -0
  7. llama_stack/core/storage/kvstore/postgres/postgres.py +8 -0
  8. llama_stack/core/storage/kvstore/redis/redis.py +5 -0
  9. llama_stack/core/storage/sqlstore/sqlalchemy_sqlstore.py +8 -0
  10. llama_stack/core/storage/sqlstore/sqlstore.py +8 -0
  11. llama_stack/distributions/dell/doc_template.md +209 -0
  12. llama_stack/distributions/meta-reference-gpu/doc_template.md +119 -0
  13. llama_stack/distributions/nvidia/doc_template.md +170 -0
  14. llama_stack/distributions/oci/doc_template.md +140 -0
  15. llama_stack/models/llama/llama3/dog.jpg +0 -0
  16. llama_stack/models/llama/llama3/pasta.jpeg +0 -0
  17. llama_stack/models/llama/resources/dog.jpg +0 -0
  18. llama_stack/models/llama/resources/pasta.jpeg +0 -0
  19. llama_stack/models/llama/resources/small_dog.jpg +0 -0
  20. llama_stack/providers/inline/agents/meta_reference/responses/openai_responses.py +184 -33
  21. llama_stack/providers/inline/agents/meta_reference/responses/streaming.py +4 -0
  22. llama_stack/providers/inline/agents/meta_reference/responses/tool_executor.py +9 -1
  23. llama_stack/providers/inline/ios/inference/LocalInferenceImpl/LocalInference.h +9 -0
  24. llama_stack/providers/inline/ios/inference/LocalInferenceImpl/LocalInference.swift +189 -0
  25. llama_stack/providers/inline/ios/inference/LocalInferenceImpl/Parsing.swift +238 -0
  26. llama_stack/providers/inline/ios/inference/LocalInferenceImpl/PromptTemplate.swift +12 -0
  27. llama_stack/providers/inline/ios/inference/LocalInferenceImpl/SystemPrompts.swift +89 -0
  28. llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.pbxproj +550 -0
  29. llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.xcworkspace/contents.xcworkspacedata +7 -0
  30. llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist +8 -0
  31. llama_stack/providers/remote/datasetio/nvidia/README.md +74 -0
  32. llama_stack/providers/remote/eval/nvidia/README.md +134 -0
  33. llama_stack/providers/remote/files/s3/README.md +266 -0
  34. llama_stack/providers/remote/inference/nvidia/NVIDIA.md +203 -0
  35. llama_stack/providers/remote/post_training/nvidia/README.md +151 -0
  36. llama_stack/providers/remote/safety/nvidia/README.md +78 -0
  37. llama_stack/providers/remote/vector_io/pgvector/pgvector.py +13 -1
  38. llama_stack/providers/utils/inference/embedding_mixin.py +20 -16
  39. llama_stack/providers/utils/memory/openai_vector_store_mixin.py +33 -0
  40. llama_stack/providers/utils/responses/responses_store.py +34 -0
  41. llama_stack/providers/utils/tools/mcp.py +258 -16
  42. {llama_stack-0.4.2.dist-info → llama_stack-0.4.4.dist-info}/METADATA +2 -2
  43. {llama_stack-0.4.2.dist-info → llama_stack-0.4.4.dist-info}/RECORD +47 -158
  44. {llama_stack-0.4.2.dist-info → llama_stack-0.4.4.dist-info}/WHEEL +1 -1
  45. llama_stack-0.4.4.dist-info/top_level.txt +1 -0
  46. llama_stack-0.4.2.dist-info/top_level.txt +0 -2
  47. llama_stack_api/__init__.py +0 -945
  48. llama_stack_api/admin/__init__.py +0 -45
  49. llama_stack_api/admin/api.py +0 -72
  50. llama_stack_api/admin/fastapi_routes.py +0 -117
  51. llama_stack_api/admin/models.py +0 -113
  52. llama_stack_api/agents.py +0 -173
  53. llama_stack_api/batches/__init__.py +0 -40
  54. llama_stack_api/batches/api.py +0 -53
  55. llama_stack_api/batches/fastapi_routes.py +0 -113
  56. llama_stack_api/batches/models.py +0 -78
  57. llama_stack_api/benchmarks/__init__.py +0 -43
  58. llama_stack_api/benchmarks/api.py +0 -39
  59. llama_stack_api/benchmarks/fastapi_routes.py +0 -109
  60. llama_stack_api/benchmarks/models.py +0 -109
  61. llama_stack_api/common/__init__.py +0 -5
  62. llama_stack_api/common/content_types.py +0 -101
  63. llama_stack_api/common/errors.py +0 -95
  64. llama_stack_api/common/job_types.py +0 -38
  65. llama_stack_api/common/responses.py +0 -77
  66. llama_stack_api/common/training_types.py +0 -47
  67. llama_stack_api/common/type_system.py +0 -146
  68. llama_stack_api/connectors.py +0 -146
  69. llama_stack_api/conversations.py +0 -270
  70. llama_stack_api/datasetio.py +0 -55
  71. llama_stack_api/datasets/__init__.py +0 -61
  72. llama_stack_api/datasets/api.py +0 -35
  73. llama_stack_api/datasets/fastapi_routes.py +0 -104
  74. llama_stack_api/datasets/models.py +0 -152
  75. llama_stack_api/datatypes.py +0 -373
  76. llama_stack_api/eval.py +0 -137
  77. llama_stack_api/file_processors/__init__.py +0 -27
  78. llama_stack_api/file_processors/api.py +0 -64
  79. llama_stack_api/file_processors/fastapi_routes.py +0 -78
  80. llama_stack_api/file_processors/models.py +0 -42
  81. llama_stack_api/files/__init__.py +0 -35
  82. llama_stack_api/files/api.py +0 -51
  83. llama_stack_api/files/fastapi_routes.py +0 -124
  84. llama_stack_api/files/models.py +0 -107
  85. llama_stack_api/inference.py +0 -1169
  86. llama_stack_api/inspect_api/__init__.py +0 -37
  87. llama_stack_api/inspect_api/api.py +0 -25
  88. llama_stack_api/inspect_api/fastapi_routes.py +0 -76
  89. llama_stack_api/inspect_api/models.py +0 -28
  90. llama_stack_api/internal/__init__.py +0 -9
  91. llama_stack_api/internal/kvstore.py +0 -26
  92. llama_stack_api/internal/sqlstore.py +0 -79
  93. llama_stack_api/llama_stack_api/__init__.py +0 -945
  94. llama_stack_api/llama_stack_api/admin/__init__.py +0 -45
  95. llama_stack_api/llama_stack_api/admin/api.py +0 -72
  96. llama_stack_api/llama_stack_api/admin/fastapi_routes.py +0 -117
  97. llama_stack_api/llama_stack_api/admin/models.py +0 -113
  98. llama_stack_api/llama_stack_api/agents.py +0 -173
  99. llama_stack_api/llama_stack_api/batches/__init__.py +0 -40
  100. llama_stack_api/llama_stack_api/batches/api.py +0 -53
  101. llama_stack_api/llama_stack_api/batches/fastapi_routes.py +0 -113
  102. llama_stack_api/llama_stack_api/batches/models.py +0 -78
  103. llama_stack_api/llama_stack_api/benchmarks/__init__.py +0 -43
  104. llama_stack_api/llama_stack_api/benchmarks/api.py +0 -39
  105. llama_stack_api/llama_stack_api/benchmarks/fastapi_routes.py +0 -109
  106. llama_stack_api/llama_stack_api/benchmarks/models.py +0 -109
  107. llama_stack_api/llama_stack_api/common/__init__.py +0 -5
  108. llama_stack_api/llama_stack_api/common/content_types.py +0 -101
  109. llama_stack_api/llama_stack_api/common/errors.py +0 -95
  110. llama_stack_api/llama_stack_api/common/job_types.py +0 -38
  111. llama_stack_api/llama_stack_api/common/responses.py +0 -77
  112. llama_stack_api/llama_stack_api/common/training_types.py +0 -47
  113. llama_stack_api/llama_stack_api/common/type_system.py +0 -146
  114. llama_stack_api/llama_stack_api/connectors.py +0 -146
  115. llama_stack_api/llama_stack_api/conversations.py +0 -270
  116. llama_stack_api/llama_stack_api/datasetio.py +0 -55
  117. llama_stack_api/llama_stack_api/datasets/__init__.py +0 -61
  118. llama_stack_api/llama_stack_api/datasets/api.py +0 -35
  119. llama_stack_api/llama_stack_api/datasets/fastapi_routes.py +0 -104
  120. llama_stack_api/llama_stack_api/datasets/models.py +0 -152
  121. llama_stack_api/llama_stack_api/datatypes.py +0 -373
  122. llama_stack_api/llama_stack_api/eval.py +0 -137
  123. llama_stack_api/llama_stack_api/file_processors/__init__.py +0 -27
  124. llama_stack_api/llama_stack_api/file_processors/api.py +0 -64
  125. llama_stack_api/llama_stack_api/file_processors/fastapi_routes.py +0 -78
  126. llama_stack_api/llama_stack_api/file_processors/models.py +0 -42
  127. llama_stack_api/llama_stack_api/files/__init__.py +0 -35
  128. llama_stack_api/llama_stack_api/files/api.py +0 -51
  129. llama_stack_api/llama_stack_api/files/fastapi_routes.py +0 -124
  130. llama_stack_api/llama_stack_api/files/models.py +0 -107
  131. llama_stack_api/llama_stack_api/inference.py +0 -1169
  132. llama_stack_api/llama_stack_api/inspect_api/__init__.py +0 -37
  133. llama_stack_api/llama_stack_api/inspect_api/api.py +0 -25
  134. llama_stack_api/llama_stack_api/inspect_api/fastapi_routes.py +0 -76
  135. llama_stack_api/llama_stack_api/inspect_api/models.py +0 -28
  136. llama_stack_api/llama_stack_api/internal/__init__.py +0 -9
  137. llama_stack_api/llama_stack_api/internal/kvstore.py +0 -26
  138. llama_stack_api/llama_stack_api/internal/sqlstore.py +0 -79
  139. llama_stack_api/llama_stack_api/models.py +0 -171
  140. llama_stack_api/llama_stack_api/openai_responses.py +0 -1468
  141. llama_stack_api/llama_stack_api/post_training.py +0 -370
  142. llama_stack_api/llama_stack_api/prompts.py +0 -203
  143. llama_stack_api/llama_stack_api/providers/__init__.py +0 -33
  144. llama_stack_api/llama_stack_api/providers/api.py +0 -16
  145. llama_stack_api/llama_stack_api/providers/fastapi_routes.py +0 -57
  146. llama_stack_api/llama_stack_api/providers/models.py +0 -24
  147. llama_stack_api/llama_stack_api/py.typed +0 -0
  148. llama_stack_api/llama_stack_api/rag_tool.py +0 -168
  149. llama_stack_api/llama_stack_api/resource.py +0 -37
  150. llama_stack_api/llama_stack_api/router_utils.py +0 -160
  151. llama_stack_api/llama_stack_api/safety.py +0 -132
  152. llama_stack_api/llama_stack_api/schema_utils.py +0 -208
  153. llama_stack_api/llama_stack_api/scoring.py +0 -93
  154. llama_stack_api/llama_stack_api/scoring_functions.py +0 -211
  155. llama_stack_api/llama_stack_api/shields.py +0 -93
  156. llama_stack_api/llama_stack_api/tools.py +0 -226
  157. llama_stack_api/llama_stack_api/vector_io.py +0 -941
  158. llama_stack_api/llama_stack_api/vector_stores.py +0 -51
  159. llama_stack_api/llama_stack_api/version.py +0 -9
  160. llama_stack_api/models.py +0 -171
  161. llama_stack_api/openai_responses.py +0 -1468
  162. llama_stack_api/post_training.py +0 -370
  163. llama_stack_api/prompts.py +0 -203
  164. llama_stack_api/providers/__init__.py +0 -33
  165. llama_stack_api/providers/api.py +0 -16
  166. llama_stack_api/providers/fastapi_routes.py +0 -57
  167. llama_stack_api/providers/models.py +0 -24
  168. llama_stack_api/py.typed +0 -0
  169. llama_stack_api/rag_tool.py +0 -168
  170. llama_stack_api/resource.py +0 -37
  171. llama_stack_api/router_utils.py +0 -160
  172. llama_stack_api/safety.py +0 -132
  173. llama_stack_api/schema_utils.py +0 -208
  174. llama_stack_api/scoring.py +0 -93
  175. llama_stack_api/scoring_functions.py +0 -211
  176. llama_stack_api/shields.py +0 -93
  177. llama_stack_api/tools.py +0 -226
  178. llama_stack_api/vector_io.py +0 -941
  179. llama_stack_api/vector_stores.py +0 -51
  180. llama_stack_api/version.py +0 -9
  181. {llama_stack-0.4.2.dist-info → llama_stack-0.4.4.dist-info}/entry_points.txt +0 -0
  182. {llama_stack-0.4.2.dist-info → llama_stack-0.4.4.dist-info}/licenses/LICENSE +0 -0
@@ -0,0 +1,550 @@
1
+ // !$*UTF8*$!
2
+ {
3
+ archiveVersion = 1;
4
+ classes = {
5
+ };
6
+ objectVersion = 56;
7
+ objects = {
8
+
9
+ /* Begin PBXBuildFile section */
10
+ 5CADC71A2CA471CC007662D2 /* LlamaStackClient in Frameworks */ = {isa = PBXBuildFile; productRef = 5CADC7192CA471CC007662D2 /* LlamaStackClient */; };
11
+ 5CAF3DD82CA485740029CD2B /* LlamaStackClient in Frameworks */ = {isa = PBXBuildFile; productRef = 5CAF3DD72CA485740029CD2B /* LlamaStackClient */; };
12
+ 5CCBC60C2CA1F04A00E958D0 /* LocalInference.h in Headers */ = {isa = PBXBuildFile; fileRef = 5CCBC60B2CA1F04A00E958D0 /* LocalInference.h */; settings = {ATTRIBUTES = (Public, ); }; };
13
+ 5CCBC6752CA1F45800E958D0 /* executorch_debug in Frameworks */ = {isa = PBXBuildFile; productRef = 5CCBC6742CA1F45800E958D0 /* executorch_debug */; };
14
+ 5CCBC6862CA1F64A00E958D0 /* LLaMARunner.framework in Frameworks */ = {isa = PBXBuildFile; fileRef = 5CCBC6802CA1F63F00E958D0 /* LLaMARunner.framework */; platformFilter = ios; };
15
+ 5CCBC6872CA1F64A00E958D0 /* LLaMARunner.framework in Embed Frameworks */ = {isa = PBXBuildFile; fileRef = 5CCBC6802CA1F63F00E958D0 /* LLaMARunner.framework */; platformFilter = ios; settings = {ATTRIBUTES = (CodeSignOnCopy, RemoveHeadersOnCopy, ); }; };
16
+ 5CCBC68D2CA1F7A100E958D0 /* PromptTemplate.swift in Sources */ = {isa = PBXBuildFile; fileRef = 5CCBC6892CA1F7A000E958D0 /* PromptTemplate.swift */; };
17
+ 5CCBC68E2CA1F7A100E958D0 /* LocalInference.swift in Sources */ = {isa = PBXBuildFile; fileRef = 5CCBC68A2CA1F7A000E958D0 /* LocalInference.swift */; };
18
+ 5CCBC68F2CA1F7A100E958D0 /* Parsing.swift in Sources */ = {isa = PBXBuildFile; fileRef = 5CCBC68B2CA1F7A000E958D0 /* Parsing.swift */; };
19
+ 5CCBC6902CA1F7A100E958D0 /* SystemPrompts.swift in Sources */ = {isa = PBXBuildFile; fileRef = 5CCBC68C2CA1F7A100E958D0 /* SystemPrompts.swift */; };
20
+ 5CCBC6932CA1F7D000E958D0 /* Stencil in Frameworks */ = {isa = PBXBuildFile; productRef = 5CCBC6922CA1F7D000E958D0 /* Stencil */; };
21
+ /* End PBXBuildFile section */
22
+
23
+ /* Begin PBXContainerItemProxy section */
24
+ 5CCBC67D2CA1F63F00E958D0 /* PBXContainerItemProxy */ = {
25
+ isa = PBXContainerItemProxy;
26
+ containerPortal = 5CCBC6762CA1F63F00E958D0 /* LLaMA.xcodeproj */;
27
+ proxyType = 2;
28
+ remoteGlobalIDString = 036CAF9D2BB1444500D6C2D5;
29
+ remoteInfo = LLaMA;
30
+ };
31
+ 5CCBC67F2CA1F63F00E958D0 /* PBXContainerItemProxy */ = {
32
+ isa = PBXContainerItemProxy;
33
+ containerPortal = 5CCBC6762CA1F63F00E958D0 /* LLaMA.xcodeproj */;
34
+ proxyType = 2;
35
+ remoteGlobalIDString = 03729ED52BB1F8DE00152F2E;
36
+ remoteInfo = LLaMARunner;
37
+ };
38
+ 5CCBC69E2CA2036B00E958D0 /* PBXContainerItemProxy */ = {
39
+ isa = PBXContainerItemProxy;
40
+ containerPortal = 5CCBC6762CA1F63F00E958D0 /* LLaMA.xcodeproj */;
41
+ proxyType = 2;
42
+ remoteGlobalIDString = 5CCBC6982CA2036A00E958D0;
43
+ remoteInfo = LLaMAPerfBenchmark;
44
+ };
45
+ 5CCBC6A02CA2036B00E958D0 /* PBXContainerItemProxy */ = {
46
+ isa = PBXContainerItemProxy;
47
+ containerPortal = 5CCBC6762CA1F63F00E958D0 /* LLaMA.xcodeproj */;
48
+ proxyType = 2;
49
+ remoteGlobalIDString = 5CCBC6992CA2036A00E958D0;
50
+ remoteInfo = LLaMAPerfBenchmarkTests;
51
+ };
52
+ /* End PBXContainerItemProxy section */
53
+
54
+ /* Begin PBXCopyFilesBuildPhase section */
55
+ 5CCBC6882CA1F64A00E958D0 /* Embed Frameworks */ = {
56
+ isa = PBXCopyFilesBuildPhase;
57
+ buildActionMask = 2147483647;
58
+ dstPath = "";
59
+ dstSubfolderSpec = 10;
60
+ files = (
61
+ 5CCBC6872CA1F64A00E958D0 /* LLaMARunner.framework in Embed Frameworks */,
62
+ );
63
+ name = "Embed Frameworks";
64
+ runOnlyForDeploymentPostprocessing = 0;
65
+ };
66
+ /* End PBXCopyFilesBuildPhase section */
67
+
68
+ /* Begin PBXFileReference section */
69
+ 5CCBC6082CA1F04A00E958D0 /* LocalInferenceImpl.framework */ = {isa = PBXFileReference; explicitFileType = wrapper.framework; includeInIndex = 0; path = LocalInferenceImpl.framework; sourceTree = BUILT_PRODUCTS_DIR; };
70
+ 5CCBC60B2CA1F04A00E958D0 /* LocalInference.h */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.c.h; path = LocalInference.h; sourceTree = "<group>"; };
71
+ 5CCBC6762CA1F63F00E958D0 /* LLaMA.xcodeproj */ = {isa = PBXFileReference; lastKnownFileType = "wrapper.pb-project"; name = LLaMA.xcodeproj; path = "executorch/examples/demo-apps/apple_ios/LLaMA/LLaMA.xcodeproj"; sourceTree = "<group>"; };
72
+ 5CCBC6892CA1F7A000E958D0 /* PromptTemplate.swift */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.swift; path = PromptTemplate.swift; sourceTree = "<group>"; };
73
+ 5CCBC68A2CA1F7A000E958D0 /* LocalInference.swift */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.swift; path = LocalInference.swift; sourceTree = "<group>"; };
74
+ 5CCBC68B2CA1F7A000E958D0 /* Parsing.swift */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.swift; path = Parsing.swift; sourceTree = "<group>"; };
75
+ 5CCBC68C2CA1F7A100E958D0 /* SystemPrompts.swift */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.swift; path = SystemPrompts.swift; sourceTree = "<group>"; };
76
+ /* End PBXFileReference section */
77
+
78
+ /* Begin PBXFrameworksBuildPhase section */
79
+ 5CCBC6052CA1F04A00E958D0 /* Frameworks */ = {
80
+ isa = PBXFrameworksBuildPhase;
81
+ buildActionMask = 2147483647;
82
+ files = (
83
+ 5CADC71A2CA471CC007662D2 /* LlamaStackClient in Frameworks */,
84
+ 5CAF3DD82CA485740029CD2B /* LlamaStackClient in Frameworks */,
85
+ 5CCBC6932CA1F7D000E958D0 /* Stencil in Frameworks */,
86
+ 5CCBC6862CA1F64A00E958D0 /* LLaMARunner.framework in Frameworks */,
87
+ 5CCBC6752CA1F45800E958D0 /* executorch_debug in Frameworks */,
88
+ );
89
+ runOnlyForDeploymentPostprocessing = 0;
90
+ };
91
+ /* End PBXFrameworksBuildPhase section */
92
+
93
+ /* Begin PBXGroup section */
94
+ 5CCBC5FE2CA1F04A00E958D0 = {
95
+ isa = PBXGroup;
96
+ children = (
97
+ 5CCBC6762CA1F63F00E958D0 /* LLaMA.xcodeproj */,
98
+ 5CCBC60A2CA1F04A00E958D0 /* LocalInferenceImpl */,
99
+ 5CCBC6092CA1F04A00E958D0 /* Products */,
100
+ 5CCBC6852CA1F64A00E958D0 /* Frameworks */,
101
+ );
102
+ sourceTree = "<group>";
103
+ };
104
+ 5CCBC6092CA1F04A00E958D0 /* Products */ = {
105
+ isa = PBXGroup;
106
+ children = (
107
+ 5CCBC6082CA1F04A00E958D0 /* LocalInferenceImpl.framework */,
108
+ );
109
+ name = Products;
110
+ sourceTree = "<group>";
111
+ };
112
+ 5CCBC60A2CA1F04A00E958D0 /* LocalInferenceImpl */ = {
113
+ isa = PBXGroup;
114
+ children = (
115
+ 5CCBC68A2CA1F7A000E958D0 /* LocalInference.swift */,
116
+ 5CCBC68B2CA1F7A000E958D0 /* Parsing.swift */,
117
+ 5CCBC6892CA1F7A000E958D0 /* PromptTemplate.swift */,
118
+ 5CCBC68C2CA1F7A100E958D0 /* SystemPrompts.swift */,
119
+ 5CCBC60B2CA1F04A00E958D0 /* LocalInference.h */,
120
+ );
121
+ path = LocalInferenceImpl;
122
+ sourceTree = "<group>";
123
+ };
124
+ 5CCBC6772CA1F63F00E958D0 /* Products */ = {
125
+ isa = PBXGroup;
126
+ children = (
127
+ 5CCBC67E2CA1F63F00E958D0 /* LLaMA.app */,
128
+ 5CCBC6802CA1F63F00E958D0 /* LLaMARunner.framework */,
129
+ 5CCBC69F2CA2036B00E958D0 /* LLaMAPerfBenchmark.app */,
130
+ 5CCBC6A12CA2036B00E958D0 /* LLaMAPerfBenchmarkTests.xctest */,
131
+ );
132
+ name = Products;
133
+ sourceTree = "<group>";
134
+ };
135
+ 5CCBC6852CA1F64A00E958D0 /* Frameworks */ = {
136
+ isa = PBXGroup;
137
+ children = (
138
+ );
139
+ name = Frameworks;
140
+ sourceTree = "<group>";
141
+ };
142
+ /* End PBXGroup section */
143
+
144
+ /* Begin PBXHeadersBuildPhase section */
145
+ 5CCBC6032CA1F04A00E958D0 /* Headers */ = {
146
+ isa = PBXHeadersBuildPhase;
147
+ buildActionMask = 2147483647;
148
+ files = (
149
+ 5CCBC60C2CA1F04A00E958D0 /* LocalInference.h in Headers */,
150
+ );
151
+ runOnlyForDeploymentPostprocessing = 0;
152
+ };
153
+ /* End PBXHeadersBuildPhase section */
154
+
155
+ /* Begin PBXNativeTarget section */
156
+ 5CCBC6072CA1F04A00E958D0 /* LocalInferenceImpl */ = {
157
+ isa = PBXNativeTarget;
158
+ buildConfigurationList = 5CCBC60F2CA1F04A00E958D0 /* Build configuration list for PBXNativeTarget "LocalInferenceImpl" */;
159
+ buildPhases = (
160
+ 5CCBC6032CA1F04A00E958D0 /* Headers */,
161
+ 5CCBC6042CA1F04A00E958D0 /* Sources */,
162
+ 5CCBC6052CA1F04A00E958D0 /* Frameworks */,
163
+ 5CCBC6062CA1F04A00E958D0 /* Resources */,
164
+ 5CCBC6882CA1F64A00E958D0 /* Embed Frameworks */,
165
+ );
166
+ buildRules = (
167
+ );
168
+ dependencies = (
169
+ );
170
+ name = LocalInferenceImpl;
171
+ packageProductDependencies = (
172
+ 5CCBC6742CA1F45800E958D0 /* executorch_debug */,
173
+ 5CCBC6922CA1F7D000E958D0 /* Stencil */,
174
+ 5CADC7192CA471CC007662D2 /* LlamaStackClient */,
175
+ 5CAF3DD72CA485740029CD2B /* LlamaStackClient */,
176
+ );
177
+ productName = LocalInferenceProvider;
178
+ productReference = 5CCBC6082CA1F04A00E958D0 /* LocalInferenceImpl.framework */;
179
+ productType = "com.apple.product-type.framework";
180
+ };
181
+ /* End PBXNativeTarget section */
182
+
183
+ /* Begin PBXProject section */
184
+ 5CCBC5FF2CA1F04A00E958D0 /* Project object */ = {
185
+ isa = PBXProject;
186
+ attributes = {
187
+ BuildIndependentTargetsInParallel = 1;
188
+ LastUpgradeCheck = 1540;
189
+ TargetAttributes = {
190
+ 5CCBC6072CA1F04A00E958D0 = {
191
+ CreatedOnToolsVersion = 15.4;
192
+ LastSwiftMigration = 1540;
193
+ };
194
+ };
195
+ };
196
+ buildConfigurationList = 5CCBC6022CA1F04A00E958D0 /* Build configuration list for PBXProject "LocalInferenceImpl" */;
197
+ compatibilityVersion = "Xcode 14.0";
198
+ developmentRegion = en;
199
+ hasScannedForEncodings = 0;
200
+ knownRegions = (
201
+ en,
202
+ Base,
203
+ );
204
+ mainGroup = 5CCBC5FE2CA1F04A00E958D0;
205
+ packageReferences = (
206
+ 5CCBC6732CA1F45800E958D0 /* XCRemoteSwiftPackageReference "executorch" */,
207
+ 5CCBC6912CA1F7D000E958D0 /* XCRemoteSwiftPackageReference "Stencil" */,
208
+ 5CAF3DD62CA485740029CD2B /* XCRemoteSwiftPackageReference "llama-stack-client-swift" */,
209
+ );
210
+ productRefGroup = 5CCBC6092CA1F04A00E958D0 /* Products */;
211
+ projectDirPath = "";
212
+ projectReferences = (
213
+ {
214
+ ProductGroup = 5CCBC6772CA1F63F00E958D0 /* Products */;
215
+ ProjectRef = 5CCBC6762CA1F63F00E958D0 /* LLaMA.xcodeproj */;
216
+ },
217
+ );
218
+ projectRoot = "";
219
+ targets = (
220
+ 5CCBC6072CA1F04A00E958D0 /* LocalInferenceImpl */,
221
+ );
222
+ };
223
+ /* End PBXProject section */
224
+
225
+ /* Begin PBXReferenceProxy section */
226
+ 5CCBC67E2CA1F63F00E958D0 /* LLaMA.app */ = {
227
+ isa = PBXReferenceProxy;
228
+ fileType = wrapper.application;
229
+ path = LLaMA.app;
230
+ remoteRef = 5CCBC67D2CA1F63F00E958D0 /* PBXContainerItemProxy */;
231
+ sourceTree = BUILT_PRODUCTS_DIR;
232
+ };
233
+ 5CCBC6802CA1F63F00E958D0 /* LLaMARunner.framework */ = {
234
+ isa = PBXReferenceProxy;
235
+ fileType = wrapper.framework;
236
+ path = LLaMARunner.framework;
237
+ remoteRef = 5CCBC67F2CA1F63F00E958D0 /* PBXContainerItemProxy */;
238
+ sourceTree = BUILT_PRODUCTS_DIR;
239
+ };
240
+ 5CCBC69F2CA2036B00E958D0 /* LLaMAPerfBenchmark.app */ = {
241
+ isa = PBXReferenceProxy;
242
+ fileType = wrapper.application;
243
+ path = LLaMAPerfBenchmark.app;
244
+ remoteRef = 5CCBC69E2CA2036B00E958D0 /* PBXContainerItemProxy */;
245
+ sourceTree = BUILT_PRODUCTS_DIR;
246
+ };
247
+ 5CCBC6A12CA2036B00E958D0 /* LLaMAPerfBenchmarkTests.xctest */ = {
248
+ isa = PBXReferenceProxy;
249
+ fileType = wrapper.cfbundle;
250
+ path = LLaMAPerfBenchmarkTests.xctest;
251
+ remoteRef = 5CCBC6A02CA2036B00E958D0 /* PBXContainerItemProxy */;
252
+ sourceTree = BUILT_PRODUCTS_DIR;
253
+ };
254
+ /* End PBXReferenceProxy section */
255
+
256
+ /* Begin PBXResourcesBuildPhase section */
257
+ 5CCBC6062CA1F04A00E958D0 /* Resources */ = {
258
+ isa = PBXResourcesBuildPhase;
259
+ buildActionMask = 2147483647;
260
+ files = (
261
+ );
262
+ runOnlyForDeploymentPostprocessing = 0;
263
+ };
264
+ /* End PBXResourcesBuildPhase section */
265
+
266
+ /* Begin PBXSourcesBuildPhase section */
267
+ 5CCBC6042CA1F04A00E958D0 /* Sources */ = {
268
+ isa = PBXSourcesBuildPhase;
269
+ buildActionMask = 2147483647;
270
+ files = (
271
+ 5CCBC6902CA1F7A100E958D0 /* SystemPrompts.swift in Sources */,
272
+ 5CCBC68D2CA1F7A100E958D0 /* PromptTemplate.swift in Sources */,
273
+ 5CCBC68F2CA1F7A100E958D0 /* Parsing.swift in Sources */,
274
+ 5CCBC68E2CA1F7A100E958D0 /* LocalInference.swift in Sources */,
275
+ );
276
+ runOnlyForDeploymentPostprocessing = 0;
277
+ };
278
+ /* End PBXSourcesBuildPhase section */
279
+
280
+ /* Begin XCBuildConfiguration section */
281
+ 5CCBC60D2CA1F04A00E958D0 /* Debug */ = {
282
+ isa = XCBuildConfiguration;
283
+ buildSettings = {
284
+ ALWAYS_SEARCH_USER_PATHS = NO;
285
+ ASSETCATALOG_COMPILER_GENERATE_SWIFT_ASSET_SYMBOL_EXTENSIONS = YES;
286
+ CLANG_ANALYZER_NONNULL = YES;
287
+ CLANG_ANALYZER_NUMBER_OBJECT_CONVERSION = YES_AGGRESSIVE;
288
+ CLANG_CXX_LANGUAGE_STANDARD = "gnu++20";
289
+ CLANG_ENABLE_MODULES = YES;
290
+ CLANG_ENABLE_OBJC_ARC = YES;
291
+ CLANG_ENABLE_OBJC_WEAK = YES;
292
+ CLANG_WARN_BLOCK_CAPTURE_AUTORELEASING = YES;
293
+ CLANG_WARN_BOOL_CONVERSION = YES;
294
+ CLANG_WARN_COMMA = YES;
295
+ CLANG_WARN_CONSTANT_CONVERSION = YES;
296
+ CLANG_WARN_DEPRECATED_OBJC_IMPLEMENTATIONS = YES;
297
+ CLANG_WARN_DIRECT_OBJC_ISA_USAGE = YES_ERROR;
298
+ CLANG_WARN_DOCUMENTATION_COMMENTS = YES;
299
+ CLANG_WARN_EMPTY_BODY = YES;
300
+ CLANG_WARN_ENUM_CONVERSION = YES;
301
+ CLANG_WARN_INFINITE_RECURSION = YES;
302
+ CLANG_WARN_INT_CONVERSION = YES;
303
+ CLANG_WARN_NON_LITERAL_NULL_CONVERSION = YES;
304
+ CLANG_WARN_OBJC_IMPLICIT_RETAIN_SELF = YES;
305
+ CLANG_WARN_OBJC_LITERAL_CONVERSION = YES;
306
+ CLANG_WARN_OBJC_ROOT_CLASS = YES_ERROR;
307
+ CLANG_WARN_QUOTED_INCLUDE_IN_FRAMEWORK_HEADER = YES;
308
+ CLANG_WARN_RANGE_LOOP_ANALYSIS = YES;
309
+ CLANG_WARN_STRICT_PROTOTYPES = YES;
310
+ CLANG_WARN_SUSPICIOUS_MOVE = YES;
311
+ CLANG_WARN_UNGUARDED_AVAILABILITY = YES_AGGRESSIVE;
312
+ CLANG_WARN_UNREACHABLE_CODE = YES;
313
+ CLANG_WARN__DUPLICATE_METHOD_MATCH = YES;
314
+ COPY_PHASE_STRIP = NO;
315
+ CURRENT_PROJECT_VERSION = 1;
316
+ DEBUG_INFORMATION_FORMAT = dwarf;
317
+ ENABLE_STRICT_OBJC_MSGSEND = YES;
318
+ ENABLE_TESTABILITY = YES;
319
+ ENABLE_USER_SCRIPT_SANDBOXING = YES;
320
+ GCC_C_LANGUAGE_STANDARD = gnu17;
321
+ GCC_DYNAMIC_NO_PIC = NO;
322
+ GCC_NO_COMMON_BLOCKS = YES;
323
+ GCC_OPTIMIZATION_LEVEL = 0;
324
+ GCC_PREPROCESSOR_DEFINITIONS = (
325
+ "DEBUG=1",
326
+ "$(inherited)",
327
+ );
328
+ GCC_WARN_64_TO_32_BIT_CONVERSION = YES;
329
+ GCC_WARN_ABOUT_RETURN_TYPE = YES_ERROR;
330
+ GCC_WARN_UNDECLARED_SELECTOR = YES;
331
+ GCC_WARN_UNINITIALIZED_AUTOS = YES_AGGRESSIVE;
332
+ GCC_WARN_UNUSED_FUNCTION = YES;
333
+ GCC_WARN_UNUSED_VARIABLE = YES;
334
+ IPHONEOS_DEPLOYMENT_TARGET = 17.5;
335
+ LOCALIZATION_PREFERS_STRING_CATALOGS = YES;
336
+ MTL_ENABLE_DEBUG_INFO = INCLUDE_SOURCE;
337
+ MTL_FAST_MATH = YES;
338
+ ONLY_ACTIVE_ARCH = YES;
339
+ SDKROOT = iphoneos;
340
+ SWIFT_ACTIVE_COMPILATION_CONDITIONS = "DEBUG $(inherited)";
341
+ SWIFT_OPTIMIZATION_LEVEL = "-Onone";
342
+ VERSIONING_SYSTEM = "apple-generic";
343
+ VERSION_INFO_PREFIX = "";
344
+ };
345
+ name = Debug;
346
+ };
347
+ 5CCBC60E2CA1F04A00E958D0 /* Release */ = {
348
+ isa = XCBuildConfiguration;
349
+ buildSettings = {
350
+ ALWAYS_SEARCH_USER_PATHS = NO;
351
+ ASSETCATALOG_COMPILER_GENERATE_SWIFT_ASSET_SYMBOL_EXTENSIONS = YES;
352
+ CLANG_ANALYZER_NONNULL = YES;
353
+ CLANG_ANALYZER_NUMBER_OBJECT_CONVERSION = YES_AGGRESSIVE;
354
+ CLANG_CXX_LANGUAGE_STANDARD = "gnu++20";
355
+ CLANG_ENABLE_MODULES = YES;
356
+ CLANG_ENABLE_OBJC_ARC = YES;
357
+ CLANG_ENABLE_OBJC_WEAK = YES;
358
+ CLANG_WARN_BLOCK_CAPTURE_AUTORELEASING = YES;
359
+ CLANG_WARN_BOOL_CONVERSION = YES;
360
+ CLANG_WARN_COMMA = YES;
361
+ CLANG_WARN_CONSTANT_CONVERSION = YES;
362
+ CLANG_WARN_DEPRECATED_OBJC_IMPLEMENTATIONS = YES;
363
+ CLANG_WARN_DIRECT_OBJC_ISA_USAGE = YES_ERROR;
364
+ CLANG_WARN_DOCUMENTATION_COMMENTS = YES;
365
+ CLANG_WARN_EMPTY_BODY = YES;
366
+ CLANG_WARN_ENUM_CONVERSION = YES;
367
+ CLANG_WARN_INFINITE_RECURSION = YES;
368
+ CLANG_WARN_INT_CONVERSION = YES;
369
+ CLANG_WARN_NON_LITERAL_NULL_CONVERSION = YES;
370
+ CLANG_WARN_OBJC_IMPLICIT_RETAIN_SELF = YES;
371
+ CLANG_WARN_OBJC_LITERAL_CONVERSION = YES;
372
+ CLANG_WARN_OBJC_ROOT_CLASS = YES_ERROR;
373
+ CLANG_WARN_QUOTED_INCLUDE_IN_FRAMEWORK_HEADER = YES;
374
+ CLANG_WARN_RANGE_LOOP_ANALYSIS = YES;
375
+ CLANG_WARN_STRICT_PROTOTYPES = YES;
376
+ CLANG_WARN_SUSPICIOUS_MOVE = YES;
377
+ CLANG_WARN_UNGUARDED_AVAILABILITY = YES_AGGRESSIVE;
378
+ CLANG_WARN_UNREACHABLE_CODE = YES;
379
+ CLANG_WARN__DUPLICATE_METHOD_MATCH = YES;
380
+ COPY_PHASE_STRIP = NO;
381
+ CURRENT_PROJECT_VERSION = 1;
382
+ DEBUG_INFORMATION_FORMAT = "dwarf-with-dsym";
383
+ ENABLE_NS_ASSERTIONS = NO;
384
+ ENABLE_STRICT_OBJC_MSGSEND = YES;
385
+ ENABLE_USER_SCRIPT_SANDBOXING = YES;
386
+ GCC_C_LANGUAGE_STANDARD = gnu17;
387
+ GCC_NO_COMMON_BLOCKS = YES;
388
+ GCC_WARN_64_TO_32_BIT_CONVERSION = YES;
389
+ GCC_WARN_ABOUT_RETURN_TYPE = YES_ERROR;
390
+ GCC_WARN_UNDECLARED_SELECTOR = YES;
391
+ GCC_WARN_UNINITIALIZED_AUTOS = YES_AGGRESSIVE;
392
+ GCC_WARN_UNUSED_FUNCTION = YES;
393
+ GCC_WARN_UNUSED_VARIABLE = YES;
394
+ IPHONEOS_DEPLOYMENT_TARGET = 17.5;
395
+ LOCALIZATION_PREFERS_STRING_CATALOGS = YES;
396
+ MTL_ENABLE_DEBUG_INFO = NO;
397
+ MTL_FAST_MATH = YES;
398
+ SDKROOT = iphoneos;
399
+ SWIFT_COMPILATION_MODE = wholemodule;
400
+ VALIDATE_PRODUCT = YES;
401
+ VERSIONING_SYSTEM = "apple-generic";
402
+ VERSION_INFO_PREFIX = "";
403
+ };
404
+ name = Release;
405
+ };
406
+ 5CCBC6102CA1F04A00E958D0 /* Debug */ = {
407
+ isa = XCBuildConfiguration;
408
+ buildSettings = {
409
+ BUILD_LIBRARY_FOR_DISTRIBUTION = YES;
410
+ CLANG_ENABLE_MODULES = YES;
411
+ CODE_SIGN_STYLE = Automatic;
412
+ CURRENT_PROJECT_VERSION = 1;
413
+ DEFINES_MODULE = YES;
414
+ DYLIB_COMPATIBILITY_VERSION = 1;
415
+ DYLIB_CURRENT_VERSION = 1;
416
+ DYLIB_INSTALL_NAME_BASE = "@rpath";
417
+ ENABLE_MODULE_VERIFIER = YES;
418
+ GENERATE_INFOPLIST_FILE = YES;
419
+ HEADER_SEARCH_PATHS = "";
420
+ INFOPLIST_KEY_NSHumanReadableCopyright = "";
421
+ INSTALL_PATH = "$(LOCAL_LIBRARY_DIR)/Frameworks";
422
+ LD_RUNPATH_SEARCH_PATHS = (
423
+ "$(inherited)",
424
+ "@executable_path/Frameworks",
425
+ "@loader_path/Frameworks",
426
+ );
427
+ MARKETING_VERSION = 1.0;
428
+ MODULE_VERIFIER_SUPPORTED_LANGUAGES = "objective-c objective-c++";
429
+ MODULE_VERIFIER_SUPPORTED_LANGUAGE_STANDARDS = "gnu17 gnu++20";
430
+ OTHER_LDFLAGS = "";
431
+ PRODUCT_BUNDLE_IDENTIFIER = meta.llamatsack.LocalInferenceProvider;
432
+ PRODUCT_NAME = "$(TARGET_NAME:c99extidentifier)";
433
+ SKIP_INSTALL = YES;
434
+ SWIFT_EMIT_LOC_STRINGS = YES;
435
+ SWIFT_INSTALL_OBJC_HEADER = NO;
436
+ SWIFT_OPTIMIZATION_LEVEL = "-Onone";
437
+ SWIFT_VERSION = 5.0;
438
+ TARGETED_DEVICE_FAMILY = "1,2";
439
+ };
440
+ name = Debug;
441
+ };
442
+ 5CCBC6112CA1F04A00E958D0 /* Release */ = {
443
+ isa = XCBuildConfiguration;
444
+ buildSettings = {
445
+ BUILD_LIBRARY_FOR_DISTRIBUTION = YES;
446
+ CLANG_ENABLE_MODULES = YES;
447
+ CODE_SIGN_STYLE = Automatic;
448
+ CURRENT_PROJECT_VERSION = 1;
449
+ DEFINES_MODULE = YES;
450
+ DYLIB_COMPATIBILITY_VERSION = 1;
451
+ DYLIB_CURRENT_VERSION = 1;
452
+ DYLIB_INSTALL_NAME_BASE = "@rpath";
453
+ ENABLE_MODULE_VERIFIER = YES;
454
+ GENERATE_INFOPLIST_FILE = YES;
455
+ HEADER_SEARCH_PATHS = "";
456
+ INFOPLIST_KEY_NSHumanReadableCopyright = "";
457
+ INSTALL_PATH = "$(LOCAL_LIBRARY_DIR)/Frameworks";
458
+ LD_RUNPATH_SEARCH_PATHS = (
459
+ "$(inherited)",
460
+ "@executable_path/Frameworks",
461
+ "@loader_path/Frameworks",
462
+ );
463
+ MARKETING_VERSION = 1.0;
464
+ MODULE_VERIFIER_SUPPORTED_LANGUAGES = "objective-c objective-c++";
465
+ MODULE_VERIFIER_SUPPORTED_LANGUAGE_STANDARDS = "gnu17 gnu++20";
466
+ OTHER_LDFLAGS = "";
467
+ PRODUCT_BUNDLE_IDENTIFIER = meta.llamatsack.LocalInferenceProvider;
468
+ PRODUCT_NAME = "$(TARGET_NAME:c99extidentifier)";
469
+ SKIP_INSTALL = YES;
470
+ SWIFT_EMIT_LOC_STRINGS = YES;
471
+ SWIFT_INSTALL_OBJC_HEADER = NO;
472
+ SWIFT_VERSION = 5.0;
473
+ TARGETED_DEVICE_FAMILY = "1,2";
474
+ };
475
+ name = Release;
476
+ };
477
+ /* End XCBuildConfiguration section */
478
+
479
+ /* Begin XCConfigurationList section */
480
+ 5CCBC6022CA1F04A00E958D0 /* Build configuration list for PBXProject "LocalInferenceImpl" */ = {
481
+ isa = XCConfigurationList;
482
+ buildConfigurations = (
483
+ 5CCBC60D2CA1F04A00E958D0 /* Debug */,
484
+ 5CCBC60E2CA1F04A00E958D0 /* Release */,
485
+ );
486
+ defaultConfigurationIsVisible = 0;
487
+ defaultConfigurationName = Release;
488
+ };
489
+ 5CCBC60F2CA1F04A00E958D0 /* Build configuration list for PBXNativeTarget "LocalInferenceImpl" */ = {
490
+ isa = XCConfigurationList;
491
+ buildConfigurations = (
492
+ 5CCBC6102CA1F04A00E958D0 /* Debug */,
493
+ 5CCBC6112CA1F04A00E958D0 /* Release */,
494
+ );
495
+ defaultConfigurationIsVisible = 0;
496
+ defaultConfigurationName = Release;
497
+ };
498
+ /* End XCConfigurationList section */
499
+
500
+ /* Begin XCRemoteSwiftPackageReference section */
501
+ 5CAF3DD62CA485740029CD2B /* XCRemoteSwiftPackageReference "llama-stack-client-swift" */ = {
502
+ isa = XCRemoteSwiftPackageReference;
503
+ repositoryURL = "https://github.com/meta-llama/llama-stack-client-swift";
504
+ requirement = {
505
+ branch = main;
506
+ kind = branch;
507
+ };
508
+ };
509
+ 5CCBC6732CA1F45800E958D0 /* XCRemoteSwiftPackageReference "executorch" */ = {
510
+ isa = XCRemoteSwiftPackageReference;
511
+ repositoryURL = "https://github.com/pytorch/executorch";
512
+ requirement = {
513
+ branch = latest;
514
+ kind = branch;
515
+ };
516
+ };
517
+ 5CCBC6912CA1F7D000E958D0 /* XCRemoteSwiftPackageReference "Stencil" */ = {
518
+ isa = XCRemoteSwiftPackageReference;
519
+ repositoryURL = "https://github.com/stencilproject/Stencil";
520
+ requirement = {
521
+ kind = upToNextMajorVersion;
522
+ minimumVersion = 0.15.1;
523
+ };
524
+ };
525
+ /* End XCRemoteSwiftPackageReference section */
526
+
527
+ /* Begin XCSwiftPackageProductDependency section */
528
+ 5CADC7192CA471CC007662D2 /* LlamaStackClient */ = {
529
+ isa = XCSwiftPackageProductDependency;
530
+ productName = LlamaStackClient;
531
+ };
532
+ 5CAF3DD72CA485740029CD2B /* LlamaStackClient */ = {
533
+ isa = XCSwiftPackageProductDependency;
534
+ package = 5CAF3DD62CA485740029CD2B /* XCRemoteSwiftPackageReference "llama-stack-client-swift" */;
535
+ productName = LlamaStackClient;
536
+ };
537
+ 5CCBC6742CA1F45800E958D0 /* executorch_debug */ = {
538
+ isa = XCSwiftPackageProductDependency;
539
+ package = 5CCBC6732CA1F45800E958D0 /* XCRemoteSwiftPackageReference "executorch" */;
540
+ productName = executorch_debug;
541
+ };
542
+ 5CCBC6922CA1F7D000E958D0 /* Stencil */ = {
543
+ isa = XCSwiftPackageProductDependency;
544
+ package = 5CCBC6912CA1F7D000E958D0 /* XCRemoteSwiftPackageReference "Stencil" */;
545
+ productName = Stencil;
546
+ };
547
+ /* End XCSwiftPackageProductDependency section */
548
+ };
549
+ rootObject = 5CCBC5FF2CA1F04A00E958D0 /* Project object */;
550
+ }
@@ -0,0 +1,7 @@
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <Workspace
3
+ version = "1.0">
4
+ <FileRef
5
+ location = "self:">
6
+ </FileRef>
7
+ </Workspace>
@@ -0,0 +1,8 @@
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
3
+ <plist version="1.0">
4
+ <dict>
5
+ <key>IDEDidComputeMac32BitWarning</key>
6
+ <true/>
7
+ </dict>
8
+ </plist>
@@ -0,0 +1,74 @@
1
+ # NVIDIA DatasetIO Provider for LlamaStack
2
+
3
+ This provider enables dataset management using NVIDIA's NeMo Customizer service.
4
+
5
+ ## Features
6
+
7
+ - Register datasets for fine-tuning LLMs
8
+ - Unregister datasets
9
+
10
+ ## Getting Started
11
+
12
+ ### Prerequisites
13
+
14
+ - LlamaStack with NVIDIA configuration
15
+ - Access to a hosted NVIDIA NeMo Microservice
16
+ - API key for authentication with the NVIDIA service
17
+
18
+ ### Setup
19
+
20
+ Build the NVIDIA environment:
21
+
22
+ ```bash
23
+ uv pip install llama-stack-client
24
+ uv run llama stack list-deps nvidia | xargs -L1 uv pip install
25
+ ```
26
+
27
+ ### Basic Usage with the LlamaStack Python Client
28
+
29
+ #### Initialize the client
30
+
31
+ ```python
32
+ import os
33
+
34
+ os.environ["NVIDIA_API_KEY"] = "your-api-key"
35
+ os.environ["NVIDIA_CUSTOMIZER_URL"] = "http://nemo.test"
36
+ os.environ["NVIDIA_DATASET_NAMESPACE"] = "default"
37
+ os.environ["NVIDIA_PROJECT_ID"] = "test-project"
38
+ from llama_stack.core.library_client import LlamaStackAsLibraryClient
39
+
40
+ client = LlamaStackAsLibraryClient("nvidia")
41
+ client.initialize()
42
+ ```
43
+
44
+ #### Register a dataset
45
+
46
+ ```python
47
+ client.datasets.register(
48
+ purpose="post-training/messages",
49
+ dataset_id="my-training-dataset",
50
+ source={"type": "uri", "uri": "hf://datasets/default/sample-dataset"},
51
+ metadata={
52
+ "format": "json",
53
+ "description": "Dataset for LLM fine-tuning",
54
+ "provider": "nvidia",
55
+ },
56
+ )
57
+ ```
58
+
59
+ #### Get a list of all registered datasets
60
+
61
+ ```python
62
+ datasets = client.datasets.list()
63
+ for dataset in datasets:
64
+     print(f"Dataset ID: {dataset.identifier}")
65
+     print(f"Description: {dataset.metadata.get('description', '')}")
66
+     print(f"Source: {dataset.source.uri}")
67
+     print("---")
68
+ ```
69
+
70
+ #### Unregister a dataset
71
+
72
+ ```python
73
+ client.datasets.unregister(dataset_id="my-training-dataset")
74
+ ```