LangChain-OpenTutorial
diff --git a/‎css/styles.css
Lines changed: 15 additions & 0 deletions b/‎css/styles.css
Lines changed: 15 additions & 0 deletions
diff --git a/‎mdconverter/__init__.py b/‎mdconverter/__init__.py
diff --git a/‎mdconverter/mdconverter.py
Lines changed: 129 additions & 0 deletions b/‎mdconverter/mdconverter.py
Lines changed: 129 additions & 0 deletions
diff --git a/‎mdconverter/mdconverter_class.py
Lines changed: 50 additions & 0 deletions b/‎mdconverter/mdconverter_class.py
Lines changed: 50 additions & 0 deletions
diff --git a/‎sample/05-GoogleGenerativeAI-(NEED-REVIEW).md
Lines changed: 7 additions & 8 deletions b/‎sample/05-GoogleGenerativeAI-(NEED-REVIEW).md
Lines changed: 7 additions & 8 deletions
@@ -0,0 +1,15 @@
+/* Box used for rendered cell output: the converter emits <pre class="custom"> blocks. */
+.custom {
+    background-color: #008d8d;
+    color: white;
+    padding: 0.25em 0.5em 0.25em 0.5em;
+    /* Wrap long lines while keeping whitespace; vendor-specific fallbacks follow. */
+    white-space: pre-wrap;       /* css-3 */
+    white-space: -moz-pre-wrap;  /* Mozilla, since 1999 */
+    white-space: -pre-wrap;      /* Opera 4-6 */
+    white-space: -o-pre-wrap;    /* Opera 7 */
+    word-wrap: break-word;       /* break long unbroken words */
+}
+
+/* Applies to every <pre> element, including those without the "custom" class. */
+pre {
+    background-color: #027c7c;
+    padding-left: 0.5em;
+}
@@ -0,0 +1,129 @@
+import codecs
+import json
+import argparse
+from typing import List, Dict, Any, Optional
+
+
+def get_default_css(css_filename: str) -> str:
+    """Return the contents of a CSS file wrapped in a ``<style>`` element.
+
+    Args:
+        css_filename: Path of the CSS file to embed.
+
+    Returns:
+        The CSS text placed between a ``<style>`` line and a ``</style>``
+        line, or an empty string when the file does not exist (a notice is
+        printed in that case instead of raising).
+    """
+    try:
+        with open(css_filename, "r", encoding="utf-8") as f:
+            css_content = f.read()
+    except FileNotFoundError:
+        # Report the path that was actually requested; callers may pass any
+        # CSS file, not only the default styles.css.
+        print(f"Could not find CSS file: {css_filename}")
+        return ""
+    return f"<style>\n{css_content}\n</style>"
+
+
+def _read_notebook_file(filename: str) -> Dict[str, Any]:
+    """Read a notebook file and parse it as JSON.
+
+    Args:
+        filename: Path of the ``.ipynb`` file to read.
+
+    Returns:
+        The parsed notebook as a dictionary.
+
+    Raises:
+        Exception: If the file cannot be opened or read (the original error
+            is chained as the cause).
+        json.JSONDecodeError: If the file content is not valid JSON.
+    """
+    try:
+        # Try UTF-8 first so the result does not depend on the machine's
+        # locale encoding, which may silently mis-decode non-ASCII text.
+        with open(filename, "r", encoding="utf-8") as f:
+            source = f.read()
+    except UnicodeDecodeError:
+        # Fall back to the platform default for files saved in a legacy encoding.
+        with open(filename, "r") as f:
+            source = f.read()
+    except Exception as e:
+        raise Exception(f"파일 변환에 실패했습니다. 에러 메시지: {str(e)}") from e
+
+    return json.loads(source)
+
+
+def _as_text_lines(value: Any) -> List[str]:
+    """Return *value* as a new list of strings (a bare string becomes one item)."""
+    return [value] if isinstance(value, str) else list(value)
+
+
+def _process_code_output(output: Dict[str, Any], cells: List[str]) -> None:
+    """Append the Markdown/HTML rendering of one code-cell output to *cells*.
+
+    For outputs with a ``"data"`` mapping, the first key (in mapping order)
+    that is ``text/html``, ``text/plain`` or ``image/png`` is rendered and the
+    rest are ignored. Outputs whose ``output_type`` is ``"stream"`` are
+    wrapped in a ``<pre class="custom">`` block. Any other output is skipped.
+
+    Args:
+        output: A single output dictionary from a notebook code cell.
+        cells: Accumulator of output fragments; extended in place.
+
+    Note:
+        *output* itself is never modified. Text values may be either a list
+        of strings or a single string.
+    """
+    if "data" in output:
+        for key, value in output["data"].items():
+            if key == "text/html":
+                cells.extend(v.replace("\n", "") for v in _as_text_lines(value))
+                cells.append("\n")
+                break
+            elif key == "text/plain":
+                cells.append('<pre class="custom">')
+                cells.extend(v.replace("\n", "") for v in _as_text_lines(value))
+                cells.append("</pre>")
+                cells.append("\n\n")
+                break
+            elif key == "image/png":
+                # The base64 payload may arrive as one string or as a list of
+                # lines; join first, then strip embedded newlines.
+                payload = "".join(_as_text_lines(value)).replace("\n", "")
+                cells.append('<img src="data:image/png;base64,{}"/>\n'.format(payload))
+                cells.append("\n\n")
+                break
+    elif output.get("output_type") == "stream":
+        # Build the fragments from a copy so the notebook's own "text" list is
+        # not altered by adding the <pre> wrapper.
+        cells.append('<pre class="custom">')
+        cells.extend(_as_text_lines(output["text"]))
+        cells.append("</pre>\n\n")
+
+
+def _process_code_cell(cell: Dict[str, Any], cells: List[str]) -> None:
+    """Append a code cell's source and rendered outputs to *cells*.
+
+    The source, when present, is emitted inside a fenced ``python`` block,
+    followed by each output rendered through ``_process_code_output``.
+
+    Args:
+        cell: A notebook cell dictionary whose ``cell_type`` is ``"code"``.
+        cells: Accumulator of output fragments; extended in place.
+    """
+    source = cell.get("source")
+    if source is not None:
+        cells.append("\n```python\n")
+        # The source may be a list of lines or one string; keep a string as a
+        # single fragment.
+        cells.extend([source] if isinstance(source, str) else source)
+        cells.append("\n```\n")
+
+    # A cell without an "outputs" key is treated as having no outputs.
+    for output in cell.get("outputs") or []:
+        _process_code_output(output, cells)
+
+
+def _process_converter(filename: str, output_filename: str, css_filename: str) -> str:
+    """Convert a notebook to Markdown and write the result to a file.
+
+    Code cells are rendered through ``_process_code_cell``; Markdown cells are
+    copied as-is followed by a newline. Cells of any other type are skipped
+    with a printed notice. The content of *css_filename* (via
+    ``get_default_css``) is placed at the top of the output.
+
+    Args:
+        filename: Path of the notebook to convert.
+        output_filename: Path of the Markdown file to write.
+        css_filename: Path of the CSS file to embed.
+
+    Returns:
+        *output_filename*, unchanged.
+    """
+    notebook = _read_notebook_file(filename)
+    cells: List[str] = []
+
+    for cell in notebook["cells"]:
+        if cell["cell_type"] == "code":
+            _process_code_cell(cell, cells)
+        elif cell["cell_type"] == "markdown":
+            cells.extend(cell["source"])
+            cells.append("\n")
+        else:
+            print(f"Unknown cell type. Verification Needed. file : {filename}")
+
+    final_output = f"{get_default_css(css_filename)}\n\n{''.join(cells)}"
+
+    # Write UTF-8 explicitly so the output does not depend on the platform's
+    # default encoding, which may be unable to represent non-ASCII text.
+    with open(output_filename, "w", encoding="utf-8") as f:
+        f.write(final_output)
+
+    return output_filename
+
+
+def convert_markdown_from_notebook(
+    filename: str,
+    css_filename: str = "css/styles.css",
+    post_fix: str = "-(NEED-REVIEW)",
+) -> str:
+    """Convert a notebook file to Markdown next to the original file.
+
+    The output path is *filename* with a trailing ``.ipynb`` replaced by
+    ``{post_fix}.md``. When *filename* does not end in ``.ipynb`` the suffix
+    is appended to the whole name, so the output never collides with the input.
+
+    Args:
+        filename: Path of the notebook to convert.
+        css_filename: Path of the CSS file to embed at the top of the output.
+        post_fix: Text inserted before the ``.md`` extension.
+
+    Returns:
+        The path of the Markdown file that was written.
+    """
+    extension = ".ipynb"
+    # Strip only a trailing extension: other ".ipynb" occurrences in the path
+    # (such as an ".ipynb_checkpoints" directory) must be left alone.
+    if filename.endswith(extension):
+        base = filename[: -len(extension)]
+    else:
+        base = filename
+    output_filename = f"{base}{post_fix}.md"
+
+    return _process_converter(filename, output_filename, css_filename)
+
+
+if __name__ == "__main__":
+    # Command-line entry point: convert one notebook to Markdown.
+    parser = argparse.ArgumentParser(
+        description="주피터 노트북을 마크다운으로 변환합니다."
+    )
+    parser.add_argument(
+        "--filename", required=True, help="변환할 주피터 노트북 파일 경로"
+    )
+    parser.add_argument("--css", default="css/styles.css", help="css file path")
+    args = parser.parse_args()
+
+    # Forward --css; otherwise the option is parsed but has no effect.
+    convert_markdown_from_notebook(args.filename, css_filename=args.css)
@@ -0,0 +1,50 @@
+from typing import Any
+from mdconverter.mdconverter import get_default_css
+from nbconvert import MarkdownExporter
+import nbformat
+
+
+class Mdconverter:
+    """Convert a Jupyter notebook to Markdown with nbconvert and prepend CSS.
+
+    Set ``filename``, ``output_filename`` and ``css_filename`` on the
+    instance, then call ``run()``.
+    """
+
+    def __init__(self) -> None:
+        self.css_filename = ""  # path of the CSS file to embed
+        self.filename = ""  # path of the notebook to convert
+        self.output_filename = ""  # path of the Markdown file to write
+        # Last converted document; defined here so the attribute always exists.
+        self.ndconverter_script = ""
+
+    def run(self) -> None:
+        """Run the conversion using the paths stored on the instance."""
+        # TODO making mdconverter using mdconvert.py
+        # self.run_mdconverter()
+        self.run_ndconverter(
+            filename=self.filename,
+            output_filename=self.output_filename,
+            css_filename=self.css_filename,
+        )
+
+    def run_ndconverter(
+        self, filename: str, output_filename: str, css_filename: str
+    ) -> None:
+        """Load the notebook, export it to Markdown, prepend CSS and save it.
+
+        The final document is also kept in ``self.ndconverter_script``.
+        """
+        notebook_content = self.load_ipynb(filename)
+        script = self.markdown_exporter(notebook_content)
+        self.ndconverter_script = self.add_prefix_css(script, css_filename)
+        self.save_script(self.ndconverter_script, output_filename)
+
+    def load_ipynb(self, filename: str) -> Any:
+        """Read *filename* with nbformat as a version-4 notebook."""
+        with open(filename, "r", encoding="utf-8") as f:
+            notebook_content = nbformat.read(f, as_version=4)
+        return notebook_content
+
+    def markdown_exporter(self, notebook_content: Any) -> str:
+        """Return the Markdown text produced by nbconvert's MarkdownExporter."""
+        exporter = MarkdownExporter()
+        # Only the body is used; the resources returned alongside are dropped.
+        script, _resources = exporter.from_notebook_node(notebook_content)
+        return script
+
+    def add_prefix_css(self, script: str, css_filename: str) -> str:
+        """Return *script* preceded by the CSS block and a blank line."""
+        return f"{get_default_css(css_filename)}\n\n{script}"
+
+    def save_script(self, script: str, output_filename: str) -> None:
+        """Write *script* to *output_filename* as UTF-8."""
+        with open(output_filename, "w", encoding="utf-8") as f:
+            f.write(script)
+
+
+# TODO Creating Multi loader
@@ -7,9 +7,9 @@
         white-space: -moz-pre-wrap;  /* Mozilla, since 1999 */
         white-space: -pre-wrap;      /* Opera 4-6 */
         white-space: -o-pre-wrap;    /* Opera 7 */
-        word-wrap: break-word;    
+        word-wrap: break-word;
     }
-    
+
     pre {
         background-color: #027c7c;
         padding-left: 0.5em;
@@ -19,8 +19,8 @@
 # Google Generative AI
 
 - Author: [HyeonJong Moon](https://github.com/hj0302)
-- Design: 
-- Peer Review: 
+- Design:
+- Peer Review:
 - This is a part of [LangChain Open Tutorial](https://github.com/LangChain-OpenTutorial/LangChain-OpenTutorial)
 
 [![Open in Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/langchain-ai/langchain-academy/blob/main/module-4/sub-graph.ipynb) [![Open in LangChain Academy](https://cdn.prod.website-files.com/65b8cd72835ceeacd4449a53/66e9eba12c7b7688aa3dbb5e_LCA-badge-green.svg)](https://academy.langchain.com/courses/take/intro-to-langgraph/lessons/58239937-lesson-2-sub-graphs)
@@ -48,7 +48,7 @@ You can use the `ChatGoogleGenerativeAI` class from the [langchain-google-genai]
 Set up the environment. You may refer to [Environment Setup](https://wikidocs.net/257836) for more details.
 
 **[Note]**
-- `langchain-opentutorial` is a package that provides a set of easy-to-use environment setup, useful functions and utilities for tutorials. 
+- `langchain-opentutorial` is a package that provides a set of easy-to-use environment setup, useful functions and utilities for tutorials.
 - You can check out [`langchain-opentutorial`](https://github.com/LangChain-OpenTutorial/langchain-opentutorial-pypi) for more details.
 
 ```python
@@ -91,7 +91,7 @@ set_env(
 
 - Please create an API KEY from [link](https://aistudio.google.com/app/apikey?hl=en).
 - Set the user's Google API key as the environment variable `GOOGLE_API_KEY`.
-You can alternatively set `GOOGLE_API_KEY` in `.env` file and load it. 
+You can alternatively set `GOOGLE_API_KEY` in `.env` file and load it.
 
 [Note] This is not necessary if you've already set `GOOGLE_API_KEY` in previous steps.
 
@@ -108,7 +108,7 @@ Import the `ChatGoogleGenerativeAI` class from the `langchain_google_genai` pack
 
 The `ChatGoogleGenerativeAI` class is used to implement conversational AI systems using Google’s Generative AI models. Through this class, users can interact with Google’s conversational AI model. Conversations with the model take place in a chat format, and the model generates appropriate responses based on user input.
 
-Because the `ChatGoogleGenerativeAI` class is integrated with the LangChain framework, it can be used alongside other LangChain components. 
+Because the `ChatGoogleGenerativeAI` class is integrated with the LangChain framework, it can be used alongside other LangChain components.
 
 For information about supported models, see: https://ai.google.dev/gemini-api/docs/models/gemini?hl=en
 
@@ -336,4 +336,3 @@ print(response.content)
 <pre class="custom">That's a picture of the Matterhorn mountain in Switzerland.  The image shows the iconic pyramidal peak covered in snow, set against a dramatic, softly colored sunset or sunrise sky.  The foreground features a gently sloping snow-covered landscape.
 
 </pre>
-