python markdownの使い方
概要
- markdownをHTMLに変換するライブラリ
- markdown形式のテーブル情報をHTMLに変換し、pandasのDataFrameに変換することができる
インストール
$ pip install markdown
使用例
import markdown
from bs4 import BeautifulSoup
import pandas as pd
from io import StringIO
markdown_text = """
# hello
## this is sample
- show table below
| Tables | Are | Cool |
| ------------- |-------------| -----|
| col 3 is | right-aligned | $1600 |
| col 2 is | centered | $12 |
| zebra stripes | are neat | $1 |
"""
# markdonwをHTMLに変換
html = markdown.markdown(markdown_text, extensions=['markdown.extensions.tables'])
# BeautifulSoupでHTMLを解析
soup = BeautifulSoup(html, 'html.parser')
# pandasのDataFrameに変換
df_list = pd.read_html(StringIO(str(soup)))
df = df_list[0]
df
"""
| | Tables | Are | Cool |
|---:|:--------------|:--------------|:-------|
| 0 | col 3 is | right-aligned | $1600 |
| 1 | col 2 is | centered | $12 |
| 2 | zebra stripes | are neat | $1 |
"""