o
    Xεi                     @   s2   d Z ddlZddlZdd Zedkre  dS dS )z9Converts a Phonetisaurus G2P corpus to an sqlite database    Nc                  C   sd  t jdd} | jdddd | jdddd | jd	d
dd |  }t|j}i }t|jddd<}|D ]1}|	 }|s>q5d}|
 }|D ]}|
d\}	}
|	
d}|d|7 }qF|rf||vrf|||< q5W d   n1 sqw   Y  |& |js|d |d | D ]\}}|d||f qW d   n1 sw   Y  tdt|d|j dS )zMain entry pointzcorpus2db.py)progz--corpusTz%Phonetisaurus G2P corpus file to read)requiredhelpz
--databasezSQLite database to writez	--no-drop
store_truez(Don't drop existing g2p_alignments table)actionr   rzutf-8)encoding }|Nz#DROP TABLE IF EXISTS g2p_alignmentszlCREATE TABLE IF NOT EXISTS g2p_alignments (id INTEGER PRIMARY KEY AUTOINCREMENT, word TEXT, alignment TEXT);z:INSERT INTO g2p_alignments (word, alignment) VALUES (?, ?)Addedzalignments to)argparseArgumentParseradd_argument
parse_argssqlite3connectdatabaseopencorpusstripsplitjoinno_dropexecuteitemsprintlen)parserargsconng2p_alignmentscorpus_filelinewordpartspartpart_in	_part_outpart_ins	alignment r+   C/home/ubuntu/.local/lib/python3.10/site-packages/gruut/corpus2db.pymain	   sV   

r-   __main__)__doc__r   r   r-   __name__r+   r+   r+   r,   <module>   s   >
