michi-ai 0.1.0__tar.gz → 0.1.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,12 +1,12 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: michi-ai
3
- Version: 0.1.0
3
+ Version: 0.1.1
4
4
  Summary: Full-duplex speech LLM client for MichiAI
5
5
  Home-page: https://ketsuilabs.io
6
6
  License: Apache-2.0
7
7
  Keywords: llm,speech,full-duplex,audio
8
8
  Author: Damian Krystkiewicz
9
- Author-email: damian@ketsuilabs.io
9
+ Author-email: 45499236+dkrystki@users.noreply.github.com
10
10
  Requires-Python: >=3.9,<4.0
11
11
  Classifier: License :: OSI Approved :: Apache Software License
12
12
  Classifier: Programming Language :: Python :: 3
@@ -40,7 +40,7 @@ Unlike traditional serial pipelines (ASR → LLM → TTS), MichiAI can listen an
40
40
  | **Latency (TTFA)** | ~75ms (tested on RTX 4090) |
41
41
  | **Architecture** | Continuous Embeddings + Rectified Flow Matching |
42
42
  | **Base Backbone** | SmolLM-360m |
43
- | **Key Innovation** | No Coherence Loss / Single Forward Pass per Word |
43
+ | **Key Innovation** | No Coherence Loss / Single Step Decoding |
44
44
 
45
45
 
46
46
  ## 🌟 Key Features
@@ -56,7 +56,7 @@ Unlike traditional serial pipelines (ASR → LLM → TTS), MichiAI can listen an
56
56
  ## 🤖 Architecture Overview
57
57
 
58
58
  ### 1. The Listening Head
59
- A multi-modal encoder mapping raw audio into a continuous embeddings while simultaneously generating text tokens. This ensures the model understands both the semantic meaning and the emotional context.
59
+ A multi-modal encoder mapping raw audio into continuous embeddings while simultaneously generating text tokens. This ensures the model understands both the semantic meaning and the emotional context.
60
60
 
61
61
  ### 2. The Speaking Head
62
62
  Predicts audio embeddings using **Rectified Flow Matching**. This allows for fast, high-quality, and diverse speech generation. The embeddings are then processed through a lightweight, causal **HiFi-GAN vocoder** for real-time streaming.
@@ -21,7 +21,7 @@ Unlike traditional serial pipelines (ASR → LLM → TTS), MichiAI can listen an
21
21
  | **Latency (TTFA)** | ~75ms (tested on RTX 4090) |
22
22
  | **Architecture** | Continuous Embeddings + Rectified Flow Matching |
23
23
  | **Base Backbone** | SmolLM-360m |
24
- | **Key Innovation** | No Coherence Loss / Single Forward Pass per Word |
24
+ | **Key Innovation** | No Coherence Loss / Single Step Decoding |
25
25
 
26
26
 
27
27
  ## 🌟 Key Features
@@ -37,7 +37,7 @@ Unlike traditional serial pipelines (ASR → LLM → TTS), MichiAI can listen an
37
37
  ## 🤖 Architecture Overview
38
38
 
39
39
  ### 1. The Listening Head
40
- A multi-modal encoder mapping raw audio into a continuous embeddings while simultaneously generating text tokens. This ensures the model understands both the semantic meaning and the emotional context.
40
+ A multi-modal encoder mapping raw audio into continuous embeddings while simultaneously generating text tokens. This ensures the model understands both the semantic meaning and the emotional context.
41
41
 
42
42
  ### 2. The Speaking Head
43
43
  Predicts audio embeddings using **Rectified Flow Matching**. This allows for fast, high-quality, and diverse speech generation. The embeddings are then processed through a lightweight, causal **HiFi-GAN vocoder** for real-time streaming.
@@ -1,9 +1,9 @@
1
1
  [tool.poetry]
2
2
  name = "michi-ai"
3
- version = "0.1.0"
3
+ version = "0.1.1"
4
4
  description = "Full-duplex speech LLM client for MichiAI"
5
5
  license = "Apache-2.0"
6
- authors = ["Damian Krystkiewicz <damian@ketsuilabs.io>"]
6
+ authors = ["Damian Krystkiewicz <45499236+dkrystki@users.noreply.github.com>"]
7
7
  homepage = "https://ketsuilabs.io"
8
8
  repository = "https://github.com/KetsuiLabs/MichiAI"
9
9
  readme = "README.md"
File without changes
File without changes
File without changes