Merge pull request sumanth-0#814 from aniruddhaadak9/feature/simple-markdown-converter-789

sumanth-0 · web-flow · commit d5c8801deee1 · 2025-10-12T21:17:01.000+05:30
Add Simple Markdown Converter - Fixes sumanth-0#789
diff --git a/snippets/simple_markdown_converter/README.md b/snippets/simple_markdown_converter/README.md
@@ -0,0 +1,78 @@
+# Simple Markdown Converter
+
+A lightweight Python utility to convert Markdown files to HTML or plain text format.
+
+## Description
+
+This tool converts Markdown-formatted text files into HTML or plain text, supporting common Markdown elements including headers, lists, bold/italic text, links, and code blocks.
+
+## Features
+
+- **Headers**: Supports H1 through H6 headers
+- **Lists**: Converts unordered lists (*, -)
+- **Text Formatting**: Bold (**text**) and italic (*text*)
+- **Links**: Converts [text](url) format
+- **Code**: Both inline `code` and code blocks (```)
+- **Output Formats**: HTML or plain text
+
+## Usage
+
+### Basic Usage
+
+```bash
+# Convert to HTML (default)
+python simple_markdown_converter.py input.md
+
+# Convert to plain text
+python simple_markdown_converter.py input.md -f text
+
+# Save output to file
+python simple_markdown_converter.py input.md -o output.html
+python simple_markdown_converter.py input.md -f text -o output.txt
+```
+
+### Command Line Arguments
+
+- `input_file`: Path to the input Markdown file (required)
+- `-o, --output`: Output file path (optional, defaults to stdout)
+- `-f, --format`: Output format - 'html' or 'text' (default: html)
+
+## Example
+
+**Input (example.md):**
+```markdown
+# My Document
+
+This is a **bold** statement and this is *italic*.
+
+## Features
+- First item
+- Second item
+
+Visit [GitHub](https://github.com)
+```
+
+**Output (HTML):**
+```html
+<h1>My Document</h1>
+<p>This is a <strong>bold</strong> statement and this is <em>italic</em>.</p>
+<h2>Features</h2>
+<ul>
+<li>First item</li>
+<li>Second item</li>
+</ul>
+<p>Visit <a href="https://github.com">GitHub</a></p>
+```
+
+## Requirements
+
+- Python 3.6 or higher
+- No external dependencies (uses only standard library)
+
+## Author
+
+Created as part of the 100 Lines of Python Code project.
+
+## Issue Reference
+
+Addresses Issue #789 - Simple Markdown Converter
diff --git a/snippets/simple_markdown_converter/simple_markdown_converter.py b/snippets/simple_markdown_converter/simple_markdown_converter.py
@@ -0,0 +1,136 @@
+#!/usr/bin/env python3
+"""
+Simple Markdown Converter
+Converts Markdown to HTML and plain text formats.
+Supports headers, lists, bold, italic, links, and code blocks.
+"""
+
+import re
+import sys
+import argparse
+
+
+class MarkdownConverter:
+    """A simple Markdown to HTML/plaintext converter."""
+    
+    def __init__(self):
+        self.html_output = []
+        self.text_output = []
+    
+    def convert_to_html(self, markdown_text):
+        """Convert markdown text to HTML."""
+        lines = markdown_text.split('\n')
+        in_code_block = False
+        in_list = False
+        
+        for line in lines:
+            # Handle code blocks
+            if line.strip().startswith('```'):
+                if in_code_block:
+                    self.html_output.append('</code></pre>')
+                    in_code_block = False
+                else:
+                    self.html_output.append('<pre><code>')
+                    in_code_block = True
+                continue
+            
+            if in_code_block:
+                self.html_output.append(line)
+                continue
+            
+            # Handle headers
+            header_match = re.match(r'^(#{1,6})\s+(.+)$', line)
+            if header_match:
+                level = len(header_match.group(1))
+                content = header_match.group(2)
+                content = self._process_inline(content)
+                self.html_output.append(f'<h{level}>{content}</h{level}>')
+                continue
+            
+            # Handle unordered lists
+            if re.match(r'^[*-]\s+', line):
+                if not in_list:
+                    self.html_output.append('<ul>')
+                    in_list = True
+                content = re.sub(r'^[*-]\s+', '', line)
+                content = self._process_inline(content)
+                self.html_output.append(f'<li>{content}</li>')
+                continue
+            else:
+                if in_list:
+                    self.html_output.append('</ul>')
+                    in_list = False
+            
+            # Handle empty lines
+            if not line.strip():
+                self.html_output.append('<br>')
+                continue
+            
+            # Handle regular paragraphs
+            processed_line = self._process_inline(line)
+            self.html_output.append(f'<p>{processed_line}</p>')
+        
+        # Close any open list
+        if in_list:
+            self.html_output.append('</ul>')
+        
+        return '\n'.join(self.html_output)
+    
+    def _process_inline(self, text):
+        """Process inline markdown elements like bold, italic, links."""
+        # Bold
+        text = re.sub(r'\*\*(.+?)\*\*', r'<strong>\1</strong>', text)
+        # Italic
+        text = re.sub(r'\*(.+?)\*', r'<em>\1</em>', text)
+        # Links
+        text = re.sub(r'\[(.+?)\]\((.+?)\)', r'<a href="\2">\1</a>', text)
+        # Inline code
+        text = re.sub(r'`(.+?)`', r'<code>\1</code>', text)
+        return text
+    
+    def convert_to_plaintext(self, markdown_text):
+        """Convert markdown text to plain text (strip formatting)."""
+        lines = markdown_text.split('\n')
+        
+        for line in lines:
+            # Remove markdown syntax
+            line = re.sub(r'^#{1,6}\s+', '', line)  # Headers
+            line = re.sub(r'^[*-]\s+', '• ', line)  # Lists
+            line = re.sub(r'\*\*(.+?)\*\*', r'\1', line)  # Bold
+            line = re.sub(r'\*(.+?)\*', r'\1', line)  # Italic
+            line = re.sub(r'\[(.+?)\]\((.+?)\)', r'\1', line)  # Links
+            line = re.sub(r'`(.+?)`', r'\1', line)  # Code
+            self.text_output.append(line)
+        
+        return '\n'.join(self.text_output)
+
+
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser(description='Convert Markdown to HTML or plain text')
+    parser.add_argument('input_file', help='Input markdown file')
+    parser.add_argument('-o', '--output', help='Output file (default: stdout)')
+    parser.add_argument('-f', '--format', choices=['html', 'text'], default='html',
+                        help='Output format (default: html)')
+    
+    args = parser.parse_args()
+    
+    try:
+        with open(args.input_file, 'r', encoding='utf-8') as f:
+            markdown_content = f.read()
+    except FileNotFoundError:
+        print(f'Error: File {args.input_file} not found')
+        sys.exit(1)
+    
+    converter = MarkdownConverter()
+    
+    if args.format == 'html':
+        result = converter.convert_to_html(markdown_content)
+    else:
+        result = converter.convert_to_plaintext(markdown_content)
+    
+    if args.output:
+        with open(args.output, 'w', encoding='utf-8') as f:
+            f.write(result)
+        print(f'Output written to {args.output}')
+    else:
+        print(result)