python,pandoc,luaフィルタで、太字(**)＆指定font機能を実現し、docxファイルに書き込みたい

Question

### 実現したいこと ①mdファイルの中に表がある。表の中には太字(＊＊)がないものもあり、pythonで＊＊を追記して、太字にしてdocxに書き込みたい。 ②luaフィルタで、fontの場合、指定したsize,colorをdocxに書き込みたい。 ### 発生している問題・分からないこと ①pythonで太字(＊＊)を追記して修正できているが、それが表になっていない。原因はpandocが修正した表を認識しないからというのは理解できる。しかし、fix.luaでどのように実現方法がわからない。 ②fix.luaで print(color),print(size)の結果、値は取得できている。しかし、docxファイルを見てみると、指定の色やサイズになっていない。 ### 該当のソースコード ```python(main.py) # ■■ Pandocインストール必要(https://github.com/jgm/pandoc/releases/tag/3.6.4) import os, re import subprocess from docx import Document import time # Markdownの整形処理 def md_edit(md_file_path, temp_file_path): with open(md_file_path, 'r', encoding='utf-8') as infile, open(temp_file_path, 'w', encoding='utf-8') as outfile: prev_line_flg = False for line in infile: # リンク内のスペース除外 if '', start_index) name_content = line[start_index:end_index].replace(' ', '').replace('　', '') line = line[:start_index] + name_content + line[end_index:] # URL以外は、リンク内のスペース除外 if '](' in line and ')' in line and 'http' not in line: start_index = line.find('](') + len('](') end_index = line.find(')', start_index) link_content = line[start_index:end_index].replace(' ', '').replace('　', '') line = line[:start_index] + link_content + line[end_index:] # 行の先頭が<で次に英語または/以外の文字が続く場合、<を＜に置換し、同じ行の次の>を＞に置換 if re.match(r'^<[^a-zA-Z/]', line): line = line.replace('<', '＜', 1) line = line.replace('>', '＞', 1) # "#"から始まる対象は、前回が空でなければ改行を追加 if line.startswith('#') and prev_line_flg: outfile.write(' ') # 改行追加 # ">"のみの対象は、半角スペースを追加 if line.strip() == '>': line = '> ' # 行の末尾が"
"または"
"の場合、除外 if line.rstrip().endswith('
') and line.strip() != '
': line = line.rstrip()[:-4] + ' ' elif line.rstrip().endswith('
') and line.strip() != '
': line = line.rstrip()[:-5] + ' ' # 2025/04/29 全角スペースがあるときは、半角スペースに置換 if '　' in line.strip(): line = line.replace('　',' ') #2025/05/21 表の中の太字修正 # if ("|" in line.strip()) and ("| --" not in line.strip()) and ("jpg" not in line.strip()): # parts = line.split("|")[1:-1] # '',' 'を削除(スライス) # new_parts = [] # for part in parts: # part = part.strip() # if ("*" in part) and ("**" not in part): # part = part.replace("*","**") # *が1つ存在するときもあるので修正 # elif "*" not in part: # part = f"**{part}**" # *が存在しないとき**追加 # new_parts.append(part) # line = "| " + " | ".join(new_parts) + " |" outfile.write(line) # 行反映 # 改行のみであったかチェック if line == ' ': prev_line_flg = False else: prev_line_flg = True # Word編集処理 def word_edit(docx_file_path): document = Document(docx_file_path) for paragraph in document.paragraphs: if paragraph.text.startswith('> '): paragraph.style = 'Quote' paragraph.text = paragraph.text[2:] document.save(docx_file_path) def main(): try: # ◆Markdownファイルリスト in_dir = "in" md_file_lists = list(filter(lambda f: f.endswith(".md"), os.listdir(in_dir))) # ◆ディレクトリ直下のカスタムテンプレートファイル # Wordのスタイルウィンドウを出して、出力したいスタイルのテンプレートを作成 template_file = "template.docx" # ◆出力ディレクトリ out_dir = "out" # ◆出力ディレクトリが存在しない場合は作成 if not os.path.exists(out_dir): os.makedirs(out_dir) # ◆Pandocコマンド実行 if md_file_lists: for i, md_file in enumerate(md_file_lists): input_file_path = os.path.join(in_dir, md_file) # インプットファイルパス作成 temp_file_path = os.path.join(in_dir, 'temp_' + md_file) # 一時ファイルパス作成 output_file_path = os.path.join(out_dir, os.path.splitext(os.path.basename(md_file))[0] + ".docx") # アウトプットファイルパス作成 md_edit(input_file_path, temp_file_path) # Markdownファイル整形 if template_file != "": # ◇テンプレート指定あり cmd = [ "pandoc", temp_file_path, "--reference-doc", template_file, "--lua-filter=fix.lua", "--wrap=preserve", "-o", output_file_path ] else: # ◇テンプレート指定なし cmd = [ "pandoc", temp_file_path, "--lua-filter=fix.lua", "--wrap=preserve", "-o", output_file_path ] result = subprocess.run(cmd, capture_output=True, 
text=True) # Pandoc実行 if result.returncode != 0: raise Exception(f"変換異常発生: {result.stderr} >{md_file}") word_edit(output_file_path) # word編集 os.remove(temp_file_path) # 一時ファイル削除 if i == 0: print("【変換対象ファイル一覧】") print(f"{i+1}: {md_file}") print("-- 変換完了 --") else: print("-- MDファイルなし --") except Exception as err: print(err) if __name__ == '__main__': main() ``` ```luaフィルタ(fix.lua) local b_cnt = 0 -- ブロック処理 function RawBlock(el) -- 改ページ処理 if el.text == '

' then return pandoc.RawBlock('openxml', '') else return el end end -- インライン処理 function RawInline(el) -- 2025/05/19下線処理 if el.text == '' then return pandoc.RawInline('openxml', '') -- 2025/05/19下線処理 elseif el.text == '' then return pandoc.RawInline('openxml', '') -- 改行処理 elseif el.text == '
' or el.text == '
' then return pandoc.RawInline('openxml', '') -- ブックマーク処理 elseif el.text:match('') then local b_name = el.text:match('') b_cnt = b_cnt + 1 return pandoc.RawInline('openxml', '') -- font処理 size,colorの場合がある。（問題部分はここ） elseif el.text:find("' end if size then -- OpenXML のフォントサイズは半ポイント単位（例: size=2 → 16pt → val="32"） local size_val = tonumber(size) and tostring(tonumber(size) * 8) or nil if size_val then openxml = openxml .. '' end end openxml = openxml .. '' return pandoc.RawInline('openxml', openxml) elseif el.text == '' then --print(el.text) return pandoc.RawInline('openxml', '') else return el end end -- リンク処理 function Link(el) if el.target:match("^#") then b_cnt = b_cnt + 1 local b_name = el.target:sub(2):gsub("%%20", " ") local content = pandoc.utils.stringify(el.content) return { pandoc.RawInline('openxml', ''),pandoc.RawInline('openxml', '' .. content .. ''), pandoc.RawInline('openxml', '') } else return el end end ``` ```sample.md | アイウエオ |　(pythonでアイウエオに**をつけて太字にしたい) | ------------------------------------------------------------ | | *ユーザー名：〜〜〜*
*パスワード：〜〜〜* |　(pythonで*を**にしたい) | **カキクケコ** |　(カキクケコは問題ない) | *担当者ID：〜〜〜*
* パスワード：〜〜〜* |　(pythonで*を**にしたい) ``` ### 試したこと・調べたこと - [ ] teratailやGoogle等で検索した - [x] ソースコードを自分なりに変更した - [ ] 知人に聞いた - [ ] その他 ##### 上記の詳細・結果 python,luaフィルタのコードのエラーはなく、docxファイルは作成される。 ①上記のコードを書いたが、表になっていない。 ②指定の色やサイズになっていない。 ### 補足 python 3.8.10 pandoc 3.6.4 OS:Windows

Answer

私が質問の意図を取り違えていたらすいません。

後述のコードではテーブルの先頭行を強調するのと
```text
*なにかの文字列*
``` 
を
```text
**なにかの文字列**
``` 
のように単体の * を2個の ** として置き換えるコードを提案しています。
（こちらについては Copilot に尋ねたことを白状しておきます）

以下はコードの修正点です。

md_edit 関数内の2箇所を修正します。
```python
        prev_line_flg = False
```
の行の下に以下のコード、
```python
        table_begins = False # set to True once the first (header) row of a table has been seen
```
そして
```python
            outfile.write(line) # 行反映
```
の行の上に以下のコード
```python
            # 2025/05/30 ++++++++++++ begin
            # Emphasize the table header: wrap the first row of each table in
            # ** so that pandoc renders it in bold.
            # NOTE: every pattern and replacement is a raw string. In a plain
            # string literal '\1' is the control character U+0001, not a
            # backreference to group 1, so the captured "| " / " |" text would
            # be replaced by garbage and the row would no longer be a table row.
            if re.search(r'^\| +', line):
                if not table_begins:
                    line = re.sub(r'^(\| +)', r'\1**', line)
                    line = re.sub(r'( +\|)', r'**\1', line)
                    table_begins = True
            else:
                # A line that does not look like a table row ends the table,
                # so the next table's first row is treated as a header again.
                table_begins = False

            # Turn a lone * into ** (existing ** pairs are left untouched).
            line = re.sub(r'(?<!\*)\*(?!\*)', '**', line)
            # 2025/05/30 ++++++++++++ end
```
を加えてください。

実現したいこと

発生している問題・分からないこと

該当のソースコード

試したこと・調べたこと

上記の詳細・結果

補足

関連した質問