hesychius: fix long entries upstream and handle them here
This commit is contained in:
@@ -5,5 +5,5 @@ root=https://el.wikisource.org
|
|||||||
curl -sSL "$root/wiki/%CE%93%CE%BB%CF%8E%CF%83%CF%83%CE%B1%CE%B9" \
|
curl -sSL "$root/wiki/%CE%93%CE%BB%CF%8E%CF%83%CF%83%CE%B1%CE%B9" \
|
||||||
| htmlq --attribute href 'ol li a[title^="Γλ"]' \
|
| htmlq --attribute href 'ol li a[title^="Γλ"]' \
|
||||||
| while read -r slug; do
|
| while read -r slug; do
|
||||||
curl -sSL "$root$slug" | htmlq dd | sed 's#</\?dd>##g;s#&lt;#<#g;s#&gt;#>#g'
|
curl -sSL "$root$slug" | htmlq dt,dd | tr -d '\n' | sed 's#\(<dt>\)#\n\1#g;s#<dt>\|</dd>##g;s#</dt><dd>#· #g;s#&lt;#<#g;s#&gt;#>#g'
|
||||||
done
|
done
|
||||||
|
|||||||
13732
hesychius/hesychius.txt
13732
hesychius/hesychius.txt
File diff suppressed because it is too large
Load Diff
Reference in New Issue
Block a user