
Commit e7d352a

Author: Mateusz Kopciński
Merge branch 'v0.4.0-rc1' into @md/s2t_streaming
2 parents (135eb72 + a200f34)

File tree

16 files changed (+99, -62 lines)


.cspell-wordlist.txt

Lines changed: 2 additions & 0 deletions

@@ -47,3 +47,5 @@ sublabel
 Aeonik
 Lexend
 finetuned
+MINILM
+MPNET

docs/docs/benchmarks/inference-time.md

Lines changed: 6 additions & 3 deletions

@@ -102,6 +102,9 @@ Average time for decoding one token in sequence of 100 tokens, with encoding con

 ## Text Embeddings

-| Model            | iPhone 16 Pro (XNNPACK) [ms] | iPhone 14 Pro Max (XNNPACK) [ms] | iPhone SE 3 (XNNPACK) [ms] | Samsung Galaxy S24 (XNNPACK) | OnePlus 12 (XNNPACK) [ms] |
-| ---------------- | :--------------------------: | :------------------------------: | :------------------------: | :--------------------------: | :-----------------------: |
-| ALL_MINILM_L6_V2 | 105 | 126 | 151 | 165 | 152 |
+| Model                      | iPhone 16 Pro (XNNPACK) [ms] | iPhone 14 Pro Max (XNNPACK) [ms] | iPhone SE 3 (XNNPACK) [ms] | Samsung Galaxy S24 (XNNPACK) [ms] | OnePlus 12 (XNNPACK) [ms] |
+| -------------------------- | :--------------------------: | :------------------------------: | :------------------------: | :-------------------------------: | :-----------------------: |
+| ALL_MINILM_L6_V2           | 53  | 69  | 78  | 60  | 65  |
+| ALL_MPNET_BASE_V2          | 352 | 423 | 478 | 521 | 527 |
+| MULTI_QA_MINILM_L6_COS_V1  | 135 | 166 | 180 | 158 | 165 |
+| MULTI_QA_MPNET_BASE_DOT_V1 | 503 | 598 | 680 | 694 | 743 |

docs/docs/benchmarks/memory-usage.md

Lines changed: 6 additions & 3 deletions

@@ -57,6 +57,9 @@ sidebar_position: 2

 ## Text Embeddings

-| Model            | Android (XNNPACK) [MB] | iOS (XNNPACK) [MB] |
-| ---------------- | :--------------------: | :----------------: |
-| ALL_MINILM_L6_V2 | 140 | 64 |
+| Model                      | Android (XNNPACK) [MB] | iOS (XNNPACK) [MB] |
+| -------------------------- | :--------------------: | :----------------: |
+| ALL_MINILM_L6_V2           | 150 | 190 |
+| ALL_MPNET_BASE_V2          | 520 | 470 |
+| MULTI_QA_MINILM_L6_COS_V1  | 160 | 225 |
+| MULTI_QA_MPNET_BASE_DOT_V1 | 540 | 500 |

docs/docs/benchmarks/model-size.md

Lines changed: 6 additions & 3 deletions

@@ -66,6 +66,9 @@ sidebar_position: 1

 ## Text Embeddings

-| Model            | XNNPACK [MB] |
-| ---------------- | :----------: |
-| ALL_MINILM_L6_V2 | 91 |
+| Model                      | XNNPACK [MB] |
+| -------------------------- | :----------: |
+| ALL_MINILM_L6_V2           | 91  |
+| ALL_MPNET_BASE_V2          | 438 |
+| MULTI_QA_MINILM_L6_COS_V1  | 91  |
+| MULTI_QA_MPNET_BASE_DOT_V1 | 438 |

docs/docs/natural-language-processing/useLLM.md

Lines changed: 13 additions & 15 deletions

@@ -75,7 +75,6 @@ interface LLMType {
   chatConfig?: Partial<ChatConfig>;
   toolsConfig?: ToolsConfig;
 }) => void;
-forward: (input: string) => Promise<void>;
 generate: (messages: Message[], tools?: LLMTool[]) => Promise<void>;
 sendMessage: (message: string) => Promise<void>;
 deleteMessage: (index: number) => void;

@@ -137,20 +136,19 @@ Given computational constraints, our architecture is designed to support only on

 ### Returns

-| Field              | Type                                                                        | Description |
-| ------------------ | --------------------------------------------------------------------------- | ----------- |
-| `messageHistory`   | `Message[]`                                                                 | History containing all messages in conversation. This field is updated after model responds to `sendMessage`. |
-| `response`         | `string`                                                                    | State of the generated response. This field is updated with each token generated by the model. |
-| `isReady`          | `boolean`                                                                   | Indicates whether the model is ready. |
-| `isGenerating`     | `boolean`                                                                   | Indicates whether the model is currently generating a response. |
-| `downloadProgress` | `number`                                                                    | Represents the download progress as a value between 0 and 1, indicating the extent of the model file retrieval. |
-| `error`            | <code>string &#124; null</code>                                             | Contains the error message if the model failed to load. |
-| `configure`        | `({ chatConfig?: Partial<ChatConfig>, toolsConfig?: ToolsConfig }) => void` | Configures chat and tool calling. See more details in [configuring the model](#configuring-the-model). |
-| `sendMessage`      | `(message: string, tools?: LLMTool[]) => Promise<void>`                     | Method to add user message to conversation. After model responds, `messageHistory` will be updated with both user message and model response. |
-| `deleteMessage`    | `(index: number) => void`                                                   | Deletes all messages starting with message on `index` position. After deletion `messageHistory` will be updated. |
-| `generate`         | `(messages: Message[], tools?: LLMTool[]) => Promise<void>`                 | Runs model to complete chat passed in `messages` argument. It doesn't manage conversation context. |
-| `forward`          | `(input: string) => Promise<void>`                                          | Runs model inference with raw input string. You need to provide entire conversation and prompt (in correct format and with special tokens!) in input string to this method. It doesn't manage conversation context. It is intended for users that need access to the model itself without any wrapper. If you want simple chat with model consider using `sendMessage`. |
-| `interrupt`        | `() => void`                                                                | Function to interrupt the current inference. |
+| Field              | Type                                                                        | Description |
+| ------------------ | --------------------------------------------------------------------------- | ----------- |
+| `messageHistory`   | `Message[]`                                                                 | History containing all messages in the conversation. This field is updated after the model responds to `sendMessage`. |
+| `response`         | `string`                                                                    | State of the generated response. This field is updated with each token generated by the model. |
+| `isReady`          | `boolean`                                                                   | Indicates whether the model is ready. |
+| `isGenerating`     | `boolean`                                                                   | Indicates whether the model is currently generating a response. |
+| `downloadProgress` | `number`                                                                    | Represents the download progress as a value between 0 and 1, indicating the extent of the model file retrieval. |
+| `error`            | <code>string &#124; null</code>                                             | Contains the error message if the model failed to load. |
+| `configure`        | `({ chatConfig?: Partial<ChatConfig>, toolsConfig?: ToolsConfig }) => void` | Configures chat and tool calling. See more details in [configuring the model](#configuring-the-model). |
+| `sendMessage`      | `(message: string, tools?: LLMTool[]) => Promise<void>`                     | Adds a user message to the conversation. After the model responds, `messageHistory` will be updated with both the user message and the model response. |
+| `deleteMessage`    | `(index: number) => void`                                                   | Deletes all messages starting from the message at position `index`. After deletion, `messageHistory` will be updated. |
+| `generate`         | `(messages: Message[], tools?: LLMTool[]) => Promise<void>`                 | Runs the model to complete the chat passed in the `messages` argument. It doesn't manage conversation context. |
+| `interrupt`        | `() => void`                                                                | Function to interrupt the current inference. |

 ## Configuring the model
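With `forward` removed from the hook's interface, `generate(messages, tools?)` becomes the low-level entry point, and callers now pass a structured `Message[]` instead of a raw prompt string. As a rough illustration of assembling that argument, here is a small pure helper; the exact `Message` shape is not shown in this diff, so the `{ role, content }` form below is an assumption:

```typescript
// Hypothetical sketch: the `Message` shape is assumed, not taken from this diff.
type Message = { role: 'system' | 'user' | 'assistant'; content: string };

// Builds the `messages` argument for `generate` from a system prompt,
// prior history, and a new user turn, without mutating the inputs.
function buildChat(
  systemPrompt: string,
  history: Message[],
  userInput: string
): Message[] {
  return [
    { role: 'system', content: systemPrompt },
    ...history,
    { role: 'user', content: userInput },
  ];
}
```

Unlike `sendMessage`, a call such as `llm.generate(buildChat(...))` leaves conversation bookkeeping entirely to the caller, which matches the "doesn't manage conversation context" note in the returns table.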

docs/docs/natural-language-processing/useTextEmbeddings.md

Lines changed: 24 additions & 12 deletions

@@ -110,9 +110,12 @@ function App() {

 ## Supported models

-| Model                                                                             | Language | Max Tokens | Embedding Dimensions |
-| --------------------------------------------------------------------------------- | :------: | :--------: | :------------------: |
-| [all-MiniLM-L6-v2](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2) | English  | 256        | 384                  |
+| Model                                                                                                 | Language | Max Tokens | Embedding Dimensions | Description |
+| ----------------------------------------------------------------------------------------------------- | :------: | :--------: | :------------------: | ----------- |
+| [all-MiniLM-L6-v2](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2)                     | English  | 256        | 384                  | All-round model tuned for many use-cases. Trained on a large and diverse dataset of over 1 billion training pairs. |
+| [all-mpnet-base-v2](https://huggingface.co/sentence-transformers/all-mpnet-base-v2)                   | English  | 384        | 768                  | All-round model tuned for many use-cases. Trained on a large and diverse dataset of over 1 billion training pairs. |
+| [multi-qa-MiniLM-L6-cos-v1](https://huggingface.co/sentence-transformers/multi-qa-MiniLM-L6-cos-v1)   | English  | 511        | 384                  | Tuned for semantic search: given a query/question, it can find relevant passages. Trained on a large and diverse set of (question, answer) pairs. |
+| [multi-qa-mpnet-base-dot-v1](https://huggingface.co/sentence-transformers/multi-qa-mpnet-base-dot-v1) | English  | 512        | 768                  | Tuned for semantic search: given a query/question, it can find relevant passages. Trained on a large and diverse set of (question, answer) pairs. |

 **`Max Tokens`** - the maximum number of tokens that can be processed by the model. If the input text exceeds this limit, it will be truncated.

@@ -122,22 +125,31 @@ function App() {

 ### Model size

-| Model            | XNNPACK [MB] |
-| ---------------- | :----------: |
-| ALL_MINILM_L6_V2 | 91 |
+| Model                      | XNNPACK [MB] |
+| -------------------------- | :----------: |
+| ALL_MINILM_L6_V2           | 91  |
+| ALL_MPNET_BASE_V2          | 438 |
+| MULTI_QA_MINILM_L6_COS_V1  | 91  |
+| MULTI_QA_MPNET_BASE_DOT_V1 | 438 |

 ### Memory usage

-| Model            | Android (XNNPACK) [MB] | iOS (XNNPACK) [MB] |
-| ---------------- | :--------------------: | :----------------: |
-| ALL_MINILM_L6_V2 | 140 | 64 |
+| Model                      | Android (XNNPACK) [MB] | iOS (XNNPACK) [MB] |
+| -------------------------- | :--------------------: | :----------------: |
+| ALL_MINILM_L6_V2           | 150 | 190 |
+| ALL_MPNET_BASE_V2          | 520 | 470 |
+| MULTI_QA_MINILM_L6_COS_V1  | 160 | 225 |
+| MULTI_QA_MPNET_BASE_DOT_V1 | 540 | 500 |

 ### Inference time

 :::warning warning
 Times presented in the tables are measured as consecutive runs of the model. Initial run times may be up to 2x longer due to model loading and initialization.
 :::

-| Model            | iPhone 16 Pro (XNNPACK) [ms] | iPhone 14 Pro Max (XNNPACK) [ms] | iPhone SE 3 (XNNPACK) [ms] | Samsung Galaxy S24 (XNNPACK) | OnePlus 12 (XNNPACK) [ms] |
-| ---------------- | :--------------------------: | :------------------------------: | :------------------------: | :--------------------------: | :-----------------------: |
-| ALL_MINILM_L6_V2 | 105 | 126 | 151 | 165 | 152 |
+| Model                      | iPhone 16 Pro (XNNPACK) [ms] | iPhone 14 Pro Max (XNNPACK) [ms] | iPhone SE 3 (XNNPACK) [ms] | Samsung Galaxy S24 (XNNPACK) [ms] | OnePlus 12 (XNNPACK) [ms] |
+| -------------------------- | :--------------------------: | :------------------------------: | :------------------------: | :-------------------------------: | :-----------------------: |
+| ALL_MINILM_L6_V2           | 53  | 69  | 78  | 60  | 65  |
+| ALL_MPNET_BASE_V2          | 352 | 423 | 478 | 521 | 527 |
+| MULTI_QA_MINILM_L6_COS_V1  | 135 | 166 | 180 | 158 | 165 |
+| MULTI_QA_MPNET_BASE_DOT_V1 | 503 | 598 | 680 | 694 | 743 |

examples/speech-to-text/android/app/src/main/AndroidManifest.xml

Lines changed: 1 addition & 0 deletions

@@ -1,6 +1,7 @@
 <manifest xmlns:android="http://schemas.android.com/apk/res/android">
   <uses-permission android:name="android.permission.INTERNET"/>
   <uses-permission android:name="android.permission.READ_EXTERNAL_STORAGE"/>
+  <uses-permission android:name="android.permission.RECORD_AUDIO"/>
   <uses-permission android:name="android.permission.SYSTEM_ALERT_WINDOW"/>
   <uses-permission android:name="android.permission.VIBRATE"/>
   <uses-permission android:name="android.permission.WRITE_EXTERNAL_STORAGE"/>
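The `RECORD_AUDIO` entry above covers the Android side of the speech-to-text example. It is not part of this diff, but the iOS counterpart for microphone access would be a usage description in `Info.plist`; the wording below is illustrative:

```xml
<!-- Illustrative only: iOS requires this key before the microphone can be used. -->
<key>NSMicrophoneUsageDescription</key>
<string>This app uses the microphone to transcribe speech to text.</string>
```

Note also that on Android 6.0+ `RECORD_AUDIO` is a dangerous permission, so the manifest declaration must be paired with a runtime request (e.g. via `PermissionsAndroid` in React Native).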

examples/speech-to-text/android/app/src/main/java/com/anonymous/speechtotext/MainActivity.kt

Lines changed: 2 additions & 3 deletions

@@ -27,8 +27,8 @@ class MainActivity : ReactActivity() {
    * Returns the instance of the [ReactActivityDelegate]. We use [DefaultReactActivityDelegate]
    * which allows you to enable New Architecture with a single boolean flags [fabricEnabled]
    */
-  override fun createReactActivityDelegate(): ReactActivityDelegate {
-    return ReactActivityDelegateWrapper(
+  override fun createReactActivityDelegate(): ReactActivityDelegate =
+    ReactActivityDelegateWrapper(
       this,
       BuildConfig.IS_NEW_ARCHITECTURE_ENABLED,
       object : DefaultReactActivityDelegate(

@@ -37,7 +37,6 @@ class MainActivity : ReactActivity() {
         fabricEnabled,
       ) {},
     )
-  }

   /**
    * Align the back button behavior with Android S
