Commit 1e9b7fe

Author: clams-bot
Commit message: adding metadata of llava-captioner.v1.2
1 parent 14159ac commit 1e9b7fe

File tree

5 files changed: +182 −15 lines changed

+90
@@ -0,0 +1,90 @@
---
layout: posts
classes: wide
title: "LLaVA Captioner (v1.2)"
date: 2025-02-05T22:52:42+00:00
---

## About this version

- Submitter: [kelleyl](https://github.com/kelleyl)
- Submission Time: 2025-02-05T22:52:42+00:00
- Prebuilt Container Image: [ghcr.io/clamsproject/app-llava-captioner:v1.2](https://github.com/clamsproject/app-llava-captioner/pkgs/container/app-llava-captioner/v1.2)
- Release Notes

  (no notes provided by the developer)
## About this app (See raw [metadata.json](metadata.json))

**Applies LLaVA v1.6 Mistral-7B to video frames for image captioning.**

- App ID: [http://apps.clams.ai/llava-captioner/v1.2](http://apps.clams.ai/llava-captioner/v1.2)
- App License: Apache 2.0
- Source Repository: [https://github.com/clamsproject/app-llava-captioner](https://github.com/clamsproject/app-llava-captioner) ([source tree of the submitted version](https://github.com/clamsproject/app-llava-captioner/tree/v1.2))

#### Inputs

(**Note**: "*" as a property value means that the property is required but can be any value.)

- [http://mmif.clams.ai/vocabulary/VideoDocument/v1](http://mmif.clams.ai/vocabulary/VideoDocument/v1) (required) (of any properties)
- [http://mmif.clams.ai/vocabulary/ImageDocument/v1](http://mmif.clams.ai/vocabulary/ImageDocument/v1) (required) (of any properties)
- [http://mmif.clams.ai/vocabulary/TimeFrame/v5](http://mmif.clams.ai/vocabulary/TimeFrame/v5) (required) (of any properties)
#### Configurable Parameters

(**Note**: _Multivalued_ means the parameter can have one or more values.)

- `frameInterval`: optional, defaults to `30`

  - Type: integer
  - Multivalued: False

  > The interval at which to extract frames from the video if there are no timeframe annotations. Default is every 30 frames.
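The fallback sampling behavior that `frameInterval` controls can be sketched in a few lines (a minimal illustration of the described behavior, not the app's actual implementation):

```python
def sample_frame_indices(total_frames: int, frame_interval: int = 30) -> list:
    """Return the frame indices that would be captioned when the input
    video carries no TimeFrame annotations: every frame_interval-th frame,
    starting at frame 0."""
    return list(range(0, total_frames, frame_interval))

# A 150-frame video sampled at the default interval of 30:
print(sample_frame_indices(150))  # [0, 30, 60, 90, 120]
```

With TimeFrame annotations present, the app captions the annotated frames instead and this interval is not used.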
- `defaultPrompt`: optional, defaults to `Describe what is shown in this video frame. Analyze the purpose of this frame in the context of a news video. Transcribe any text present.`

  - Type: string
  - Multivalued: False

  > Default prompt to use for timeframes not specified in the promptMap. If set to `-`, timeframes not specified in the promptMap will be skipped.

- `promptMap`: optional, defaults to `[]`

  - Type: map
  - Multivalued: True

  > Mapping of labels of the input timeframe annotations to new prompts. Must be formatted as "IN_LABEL:PROMPT" (with a colon). To pass multiple mappings, use this parameter multiple times. By default, any timeframe labels not mapped to a prompt will be used with the defaultPrompt. To skip timeframes with a particular label, pass `-` as the prompt value. To skip all timeframes not specified in the promptMap, set the defaultPrompt parameter to `-`.

- `config`: optional, defaults to `config/default.yaml`

  - Type: string
  - Multivalued: False

  > Name of the config file to use.

- `pretty`: optional, defaults to `false`

  - Type: boolean
  - Multivalued: False
  - Choices: **_`false`_**, `true`

  > The JSON body of the HTTP response will be re-formatted with 2-space indentation.
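CLAMS apps take runtime parameters as HTTP query parameters, and a multivalued parameter like `promptMap` is passed by repeating the key. A sketch of how such a query string can be built (the label names and prompts are made-up examples):

```python
from urllib.parse import urlencode

# Hypothetical parameter set: map two timeframe labels to their own
# prompts, and skip all other timeframes by setting defaultPrompt to "-".
params = {
    "defaultPrompt": "-",
    "promptMap": [
        "slate:Transcribe the text on this slate.",
        "chyron:Transcribe the chyron text.",
    ],
}

# doseq=True repeats the key once per list element, which is how a
# multivalued parameter is expressed in a query string.
query = urlencode(params, doseq=True)
print(query)
```

Note that the `IN_LABEL:PROMPT` colon is percent-encoded (`%3A`) in the resulting query string; the app decodes it before splitting on the colon.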
#### Outputs

(**Note**: "*" as a property value means that the property is required but can be any value.)

(**Note**: Not all output annotations are always generated.)

- [http://mmif.clams.ai/vocabulary/Alignment/v1](http://mmif.clams.ai/vocabulary/Alignment/v1) (of any properties)
- [http://mmif.clams.ai/vocabulary/TextDocument/v1](http://mmif.clams.ai/vocabulary/TextDocument/v1) (of any properties)
@@ -0,0 +1,68 @@
1+
{
2+
"name": "LLaVA Captioner",
3+
"description": "Applies LLaVA v1.6 Mistral-7B to video frames for image captioning.",
4+
"app_version": "v1.2",
5+
"mmif_version": "1.0.5",
6+
"app_license": "Apache 2.0",
7+
"identifier": "http://apps.clams.ai/llava-captioner/v1.2",
8+
"url": "https://github.com/clamsproject/app-llava-captioner",
9+
"input": [
10+
{
11+
"@type": "http://mmif.clams.ai/vocabulary/VideoDocument/v1",
12+
"required": true
13+
},
14+
{
15+
"@type": "http://mmif.clams.ai/vocabulary/ImageDocument/v1",
16+
"required": true
17+
},
18+
{
19+
"@type": "http://mmif.clams.ai/vocabulary/TimeFrame/v5",
20+
"required": true
21+
}
22+
],
23+
"output": [
24+
{
25+
"@type": "http://mmif.clams.ai/vocabulary/Alignment/v1"
26+
},
27+
{
28+
"@type": "http://mmif.clams.ai/vocabulary/TextDocument/v1"
29+
}
30+
],
31+
"parameters": [
32+
{
33+
"name": "frameInterval",
34+
"description": "The interval at which to extract frames from the video if there are no timeframe annotations. Default is every 30 frames.",
35+
"type": "integer",
36+
"default": 30,
37+
"multivalued": false
38+
},
39+
{
40+
"name": "defaultPrompt",
41+
"description": "default prompt to use for timeframes not specified in the promptMap. If set to `-`, timeframes not specified in the promptMap will be skipped.",
42+
"type": "string",
43+
"default": "Describe what is shown in this video frame. Analyze the purpose of this frame in the context of a news video. Transcribe any text present.",
44+
"multivalued": false
45+
},
46+
{
47+
"name": "promptMap",
48+
"description": "mapping of labels of the input timeframe annotations to new prompts. Must be formatted as \"IN_LABEL:PROMPT\" (with a colon). To pass multiple mappings, use this parameter multiple times. By default, any timeframe labels not mapped to a prompt will be used with the defaultprompt. In order to skip timeframes with a particular label, pass `-` as the prompt value.in order to skip all timeframes not specified in the promptMap, set the defaultPromptparameter to `-`",
49+
"type": "map",
50+
"default": [],
51+
"multivalued": true
52+
},
53+
{
54+
"name": "config",
55+
"description": "Name of the config file to use.",
56+
"type": "string",
57+
"default": "config/default.yaml",
58+
"multivalued": false
59+
},
60+
{
61+
"name": "pretty",
62+
"description": "The JSON body of the HTTP response will be re-formatted with 2-space indentation",
63+
"type": "boolean",
64+
"default": false,
65+
"multivalued": false
66+
}
67+
]
68+
}
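A quick sanity check one might run against a metadata.json like the one above, verifying parameter defaults by name (a sketch over an abridged excerpt, not part of the CLAMS tooling):

```python
import json

# Abridged excerpt of the metadata above (two of the five parameters).
metadata = json.loads("""
{
  "name": "LLaVA Captioner",
  "app_version": "v1.2",
  "parameters": [
    {"name": "frameInterval", "type": "integer", "default": 30, "multivalued": false},
    {"name": "promptMap", "type": "map", "default": [], "multivalued": true}
  ]
}
""")

# Index parameters by name so defaults can be looked up directly.
params = {p["name"]: p for p in metadata["parameters"]}
print(metadata["name"], metadata["app_version"], "-", len(params), "parameters")
```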
@@ -0,0 +1,5 @@
1+
{
2+
"time": "2025-02-05T22:52:42+00:00",
3+
"submitter": "kelleyl",
4+
"image": "ghcr.io/clamsproject/app-llava-captioner:v1.2"
5+
}

docs/_data/app-index.json

+18-14
@@ -1,4 +1,22 @@
 {
+  "http://apps.clams.ai/llava-captioner": {
+    "description": "Applies llava to video frames.",
+    "latest_update": "2025-02-05T22:52:42+00:00",
+    "versions": [
+      [
+        "v1.2",
+        "kelleyl"
+      ],
+      [
+        "v1.1",
+        "kelleyl"
+      ],
+      [
+        "v1.0",
+        "kelleyl"
+      ]
+    ]
+  },
   "http://apps.clams.ai/swt-detection": {
     "description": "Detects scenes with text, like slates, chyrons and credits.",
     "latest_update": "2025-02-03T22:07:54+00:00",
@@ -243,20 +261,6 @@
     ]
   ]
 },
-  "http://apps.clams.ai/llava-captioner": {
-    "description": "Applies llava to video frames.",
-    "latest_update": "2024-05-23T19:38:32+00:00",
-    "versions": [
-      [
-        "v1.1",
-        "kelleyl"
-      ],
-      [
-        "v1.0",
-        "kelleyl"
-      ]
-    ]
-  },
   "http://apps.clams.ai/inaspeechsegmenter-wrapper": {
     "description": "inaSpeechSegmenter is a CNN-based audio segmentation toolkit. The original software can be found at https://github.com/ina-foss/inaSpeechSegmenter .",
     "latest_update": "2024-05-07T03:45:14+00:00",
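The app-index.json diff does two things: it removes the old llava-captioner entry from its former position and re-inserts it at the top with v1.2 prepended to its version list, keeping the index ordered by latest update. A sketch of that update logic (`register_version` is a hypothetical helper, not the actual clams-bot code):

```python
def register_version(index, app_id, version, submitter, timestamp, description):
    """Move app_id to the front of the index (most recently updated first)
    and prepend the new (version, submitter) pair."""
    entry = index.pop(app_id, {"description": description, "versions": []})
    entry["latest_update"] = timestamp
    entry["versions"] = [[version, submitter]] + entry["versions"]
    # Rebuild the dict with the updated app first, preserving the rest.
    return {app_id: entry, **index}

# Two entries from the index, abridged:
index = {
    "http://apps.clams.ai/swt-detection": {"versions": [["v7.5", "someone"]]},
    "http://apps.clams.ai/llava-captioner": {
        "description": "Applies llava to video frames.",
        "latest_update": "2024-05-23T19:38:32+00:00",
        "versions": [["v1.1", "kelleyl"], ["v1.0", "kelleyl"]],
    },
}
index = register_version(index, "http://apps.clams.ai/llava-captioner",
                         "v1.2", "kelleyl", "2025-02-05T22:52:42+00:00",
                         "Applies llava to video frames.")
print(list(index)[0])  # llava-captioner is now first
```

This relies on Python dicts preserving insertion order, which is guaranteed since Python 3.7.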

docs/_data/apps.json

+1-1
Large diffs are not rendered by default.
