adding metadata of whisper-wrapper.v7

clams-bot · clams-bot · commit 65306f602fdd · 2024-06-24T20:24:24.000Z
diff --git a/docs/_apps/whisper-wrapper/v7/index.md b/docs/_apps/whisper-wrapper/v7/index.md
@@ -0,0 +1,90 @@
+---
+layout: posts
+classes: wide
+title: "Whisper Wrapper (v7)"
+date: 2024-06-24T20:24:22+00:00
+---
+## About this version
+
+- Submitter: [keighrim](https://github.com/keighrim)
+- Submission Time: 2024-06-24T20:24:22+00:00
+- Prebuilt Container Image: [ghcr.io/clamsproject/app-whisper-wrapper:v7](https://github.com/clamsproject/app-whisper-wrapper/pkgs/container/app-whisper-wrapper/v7)
+- Release Notes
+
+    > - Fixed minor typos in parameters  
+    > - Updated to clams-python 1.2.4, and added `cli.py` interface
+
+## About this app (See raw [metadata.json](metadata.json))
+
+**A CLAMS wrapper for Whisper-based ASR software originally developed by OpenAI.**
+
+- App ID: [http://apps.clams.ai/whisper-wrapper/v7](http://apps.clams.ai/whisper-wrapper/v7)
+- App License: Apache 2.0
+- Source Repository: [https://github.com/clamsproject/app-whisper-wrapper](https://github.com/clamsproject/app-whisper-wrapper) ([source tree of the submitted version](https://github.com/clamsproject/app-whisper-wrapper/tree/v7))
+- Analyzer Version: 20231117
+- Analyzer License: MIT
+
+
+#### Inputs
+(**Note**: "*" as a property value means that the property is required but can be any value.)
+
+One of the following is required: [
+- [http://mmif.clams.ai/vocabulary/AudioDocument/v1](http://mmif.clams.ai/vocabulary/AudioDocument/v1) (required)
+(of any properties)
+
+- [http://mmif.clams.ai/vocabulary/VideoDocument/v1](http://mmif.clams.ai/vocabulary/VideoDocument/v1) (required)
+(of any properties)
+
+
+
+]
+
+
+#### Configurable Parameters
+(**Note**: _Multivalued_ means the parameter can have one or more values.)
+
+- `modelSize`: optional, defaults to `tiny`
+
+    - Type: string
+    - Multivalued: False
+    - Choices: **_`tiny`_**, `t`, `base`, `b`, `small`, `s`, `medium`, `m`, `large`, `l`, `large-v2`, `l2`, `large-v3`, `l3`
+
+
+    > The size of the model to use. When `modelLang=en` is given, for non-`large` models, English-only models will be used instead of multilingual models for speed and accuracy. (For `large` models, English-only models are not available.)
+- `modelLang`: required
+
+    - Type: string
+    - Multivalued: False
+
+
+    > Language of the model to use, accepts two- or three-letter ISO 639 language codes, however Whisper only supports a subset of languages. If the language is not supported, an error will be raised. For the full list of supported languages, see https://github.com/openai/whisper/blob/20231117/whisper/tokenizer.py . In addition to the language code, two-letter region codes can be added to the language code, e.g. "en-US" for US English. Note that the region code is only for compatibility and recording purpose, and Whisper neither detects regional dialects, nor uses the given one for transcription. When the language code is not given, Whisper will run in language detection mode, and will use the first few seconds of the audio to detect the language.
+- `pretty`: optional, defaults to `false`
+
+    - Type: boolean
+    - Multivalued: False
+    - Choices: **_`false`_**, `true`
+
+
+    > The JSON body of the HTTP response will be re-formatted with 2-space indentation
+
+
+#### Outputs
+(**Note**: "*" as a property value means that the property is required but can be any value.)
+
+(**Note**: Not all output annotations are always generated.)
+
+- [http://mmif.clams.ai/vocabulary/TextDocument/v1](http://mmif.clams.ai/vocabulary/TextDocument/v1)
+(of any properties)
+
+- [http://mmif.clams.ai/vocabulary/TimeFrame/v5](http://mmif.clams.ai/vocabulary/TimeFrame/v5)
+    - _timeUnit_ = "milliseconds"
+
+- [http://mmif.clams.ai/vocabulary/Alignment/v1](http://mmif.clams.ai/vocabulary/Alignment/v1)
+(of any properties)
+
+- [http://vocab.lappsgrid.org/Token](http://vocab.lappsgrid.org/Token)
+(of any properties)
+
+- [http://vocab.lappsgrid.org/Sentence](http://vocab.lappsgrid.org/Sentence)
+(of any properties)
+
diff --git a/docs/_apps/whisper-wrapper/v7/metadata.json b/docs/_apps/whisper-wrapper/v7/metadata.json
@@ -0,0 +1,82 @@
+{
+  "name": "Whisper Wrapper",
+  "description": "A CLAMS wrapper for Whisper-based ASR software originally developed by OpenAI.",
+  "app_version": "v7",
+  "mmif_version": "1.0.4",
+  "analyzer_version": "20231117",
+  "app_license": "Apache 2.0",
+  "analyzer_license": "MIT",
+  "identifier": "http://apps.clams.ai/whisper-wrapper/v7",
+  "url": "https://github.com/clamsproject/app-whisper-wrapper",
+  "input": [
+    [
+      {
+        "@type": "http://mmif.clams.ai/vocabulary/AudioDocument/v1",
+        "required": true
+      },
+      {
+        "@type": "http://mmif.clams.ai/vocabulary/VideoDocument/v1",
+        "required": true
+      }
+    ]
+  ],
+  "output": [
+    {
+      "@type": "http://mmif.clams.ai/vocabulary/TextDocument/v1"
+    },
+    {
+      "@type": "http://mmif.clams.ai/vocabulary/TimeFrame/v5",
+      "properties": {
+        "timeUnit": "milliseconds"
+      }
+    },
+    {
+      "@type": "http://mmif.clams.ai/vocabulary/Alignment/v1"
+    },
+    {
+      "@type": "http://vocab.lappsgrid.org/Token"
+    },
+    {
+      "@type": "http://vocab.lappsgrid.org/Sentence"
+    }
+  ],
+  "parameters": [
+    {
+      "name": "modelSize",
+      "description": "The size of the model to use. When `modelLang=en` is given, for non-`large` models, English-only models will be used instead of multilingual models for speed and accuracy. (For `large` models, English-only models are not available.)",
+      "type": "string",
+      "choices": [
+        "tiny",
+        "t",
+        "base",
+        "b",
+        "small",
+        "s",
+        "medium",
+        "m",
+        "large",
+        "l",
+        "large-v2",
+        "l2",
+        "large-v3",
+        "l3"
+      ],
+      "default": "tiny",
+      "multivalued": false
+    },
+    {
+      "name": "modelLang",
+      "description": "Language of the model to use, accepts two- or three-letter ISO 639 language codes, however Whisper only supports a subset of languages. If the language is not supported, an error will be raised. For the full list of supported languages, see https://github.com/openai/whisper/blob/20231117/whisper/tokenizer.py . In addition to the language code, two-letter region codes can be added to the language code, e.g. \"en-US\" for US English. Note that the region code is only for compatibility and recording purpose, and Whisper neither detects regional dialects, nor uses the given one for transcription. When the language code is not given, Whisper will run in language detection mode, and will use the first few seconds of the audio to detect the language.",
+      "type": "string",
+      "default": "",
+      "multivalued": false
+    },
+    {
+      "name": "pretty",
+      "description": "The JSON body of the HTTP response will be re-formatted with 2-space indentation",
+      "type": "boolean",
+      "default": false,
+      "multivalued": false
+    }
+  ]
+}
diff --git a/docs/_apps/whisper-wrapper/v7/submission.json b/docs/_apps/whisper-wrapper/v7/submission.json
@@ -0,0 +1,6 @@
+{
+  "time": "2024-06-24T20:24:22+00:00",
+  "submitter": "keighrim",
+  "image": "ghcr.io/clamsproject/app-whisper-wrapper:v7",
+  "releasenotes": "- Fixed minor typos in parameters\n- Updated to clams-python 1.2.4, and added `cli.py` interface\n\n"
+}
diff --git a/docs/_data/app-index.json b/docs/_data/app-index.json
@@ -1,4 +1,38 @@
 {
+  "http://apps.clams.ai/whisper-wrapper": {
+    "description": "A CLAMS wrapper for Whisper-based ASR software originally developed by OpenAI.",
+    "latest_update": "2024-06-24T20:24:22+00:00",
+    "versions": [
+      [
+        "v7",
+        "keighrim"
+      ],
+      [
+        "v6",
+        "keighrim"
+      ],
+      [
+        "v5",
+        "keighrim"
+      ],
+      [
+        "v4",
+        "keighrim"
+      ],
+      [
+        "v3",
+        "keighrim"
+      ],
+      [
+        "v2",
+        "keighrim"
+      ],
+      [
+        "v1",
+        "keighrim"
+      ]
+    ]
+  },
   "http://apps.clams.ai/east-textdetection": {
     "description": "OpenCV-based text localization app that used EAST text detection model. Please visit the source code repository for full documentation.",
     "latest_update": "2024-06-24T13:52:29+00:00",
@@ -175,36 +209,6 @@
       ]
     ]
   },
-  "http://apps.clams.ai/whisper-wrapper": {
-    "description": "A CLAMS wrapper for Whisper-based ASR software originally developed by OpenAI.",
-    "latest_update": "2024-02-12T19:47:39+00:00",
-    "versions": [
-      [
-        "v6",
-        "keighrim"
-      ],
-      [
-        "v5",
-        "keighrim"
-      ],
-      [
-        "v4",
-        "keighrim"
-      ],
-      [
-        "v3",
-        "keighrim"
-      ],
-      [
-        "v2",
-        "keighrim"
-      ],
-      [
-        "v1",
-        "keighrim"
-      ]
-    ]
-  },
   "http://apps.clams.ai/easyocr-wrapper": {
     "description": "Using EasyOCR to extract text from timeframes",
     "latest_update": "2024-01-30T19:59:06+00:00",
diff --git a/docs/_data/apps.json b/docs/_data/apps.json