206 lines
4.1 KiB
Bash
206 lines
4.1 KiB
Bash
|
#!/bin/bash
|
||
|
#
|
||
|
# gd-tools - a set of programs to enhance goldendict for immersion learning.
|
||
|
# Copyright (C) 2023 Ajatt-Tools
|
||
|
#
|
||
|
# This program is free software: you can redistribute it and/or modify
|
||
|
# it under the terms of the GNU General Public License as published by
|
||
|
# the Free Software Foundation, either version 3 of the License, or
|
||
|
# (at your option) any later version.
|
||
|
#
|
||
|
# This program is distributed in the hope that it will be useful,
|
||
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
|
# GNU General Public License for more details.
|
||
|
#
|
||
|
# You should have received a copy of the GNU General Public License
|
||
|
# along with this program. If not, see <https://www.gnu.org/licenses/>.
|
||
|
|
||
|
set -euo pipefail
|
||
|
|
||
|
# Requires installing mecab
|
||
|
# Open GoldenDict, press "Edit" > "Dictionaries" > "Programs" and add this script as type html.
|
||
|
|
||
|
TEMP_FILE=/tmp/mecab-cache
|
||
|
|
||
|
# Default path to user_dic.dic, assuming that the user ran `xmake install`.
|
||
|
USER_DICT=""
|
||
|
|
||
|
FONT_SIZE=2rem
|
||
|
GDWORD=""
|
||
|
GDSEARCH=""
|
||
|
|
||
|
sanitize_input() {
|
||
|
sed -E \
|
||
|
-e 's, +,,g' \
|
||
|
-e 's,[a-z]+, ,Ig' \
|
||
|
-e 's,\n, ,g'
|
||
|
}
|
||
|
|
||
|
usage() {
|
||
|
local -r bn=$(basename -- "$0")
|
||
|
cat <<-EOF
|
||
|
usage: $bn [OPTIONS] --word %GDWORD% --sentence %GDSEARCH%
|
||
|
|
||
|
echo input back to GoldenDict as HTML with sentence split into parts
|
||
|
|
||
|
OPTIONS
|
||
|
EOF
|
||
|
column -t -s'|' <<-EOF
|
||
|
--user-dict PATH|path to the user dictionary.
|
||
|
--font-size SIZE|font size. The default value is 30px
|
||
|
EOF
|
||
|
}
|
||
|
|
||
|
find_user_dict() {
|
||
|
find \
|
||
|
"$USER_DICT" \
|
||
|
/usr/share/gd-tools/user_dic.dic \
|
||
|
~/.local/share/gd-tools/user_dic.dic \
|
||
|
-type f -print -quit 2>/dev/null
|
||
|
}
|
||
|
|
||
|
find_dicdir() {
|
||
|
dirname -- "$(
|
||
|
find \
|
||
|
/usr/lib/mecab/dic/mecab-ipadic-neologd \
|
||
|
/usr/lib/mecab/dic \
|
||
|
~/.local/share/Anki2/addons21 \
|
||
|
-type f -name dicrc -print -quit 2>/dev/null
|
||
|
)"
|
||
|
}
|
||
|
|
||
|
mecab_split() {
|
||
|
if ! command -v mecab &>/dev/null; then
|
||
|
echo "Error: MeCab is not installed. Please install MeCab and try again."
|
||
|
exit 1
|
||
|
fi
|
||
|
|
||
|
local -r user_dict=$(find_user_dict)
|
||
|
local -a args=(
|
||
|
mecab
|
||
|
--node-format='<a href="bword:%f[6]">%m</a>'
|
||
|
--unk-format='<a href="bword:%m">%m</a>'
|
||
|
--eos-format='<br>'
|
||
|
--dicdir="$(find_dicdir)"
|
||
|
--userdic="${USER_DICT}"
|
||
|
)
|
||
|
if [[ -n $user_dict ]]; then
|
||
|
args+=("$user_dict")
|
||
|
fi
|
||
|
"${args[@]}"
|
||
|
}
|
||
|
|
||
|
print_css() {
|
||
|
cat <<-EOF
|
||
|
<style>
|
||
|
* {
|
||
|
margin: 0;
|
||
|
padding: 0;
|
||
|
}
|
||
|
.gd-mecab {
|
||
|
font-size: ${FONT_SIZE:-2rem};
|
||
|
color: #1268c3;
|
||
|
font-weight: normal;
|
||
|
}
|
||
|
.gd-mecab a {
|
||
|
display: inline-block;
|
||
|
font-weight: normal;
|
||
|
color: royalblue;
|
||
|
text-decoration: none;
|
||
|
}
|
||
|
.gd-mecab a:not(:last-of-type)::after {
|
||
|
content: "";
|
||
|
display: inline-block;
|
||
|
background-color: #333;
|
||
|
margin: 4px;
|
||
|
width: 3px;
|
||
|
height: 3px;
|
||
|
border-radius: 100vmax;
|
||
|
vertical-align: middle;
|
||
|
cursor: text;
|
||
|
user-select: text;
|
||
|
}
|
||
|
.gd-mecab a b {
|
||
|
background-color: #ddeeff;
|
||
|
border-radius: 0.2rem;
|
||
|
font-weight: 500;
|
||
|
}
|
||
|
</style>
|
||
|
EOF
|
||
|
}
|
||
|
|
||
|
highlight_word() {
|
||
|
local target_word=$* search=""
|
||
|
search=$(cat -- -)
|
||
|
search=${search//">$target_word<"/"><b>${target_word}</b><"}
|
||
|
echo "$search"
|
||
|
}
|
||
|
|
||
|
die() {
|
||
|
echo "$*" >&2
|
||
|
notify-send "$(basename -- "$0")" "$*" &
|
||
|
exit 1
|
||
|
}
|
||
|
|
||
|
main() {
|
||
|
if (($# == 0)) || [[ $* == --help ]] || [[ $* == -h ]]; then
|
||
|
usage
|
||
|
exit
|
||
|
fi
|
||
|
while (($# > 0)); do
|
||
|
case $1 in
|
||
|
--font-size)
|
||
|
shift
|
||
|
FONT_SIZE=$1
|
||
|
;;
|
||
|
--user-dict)
|
||
|
shift
|
||
|
USER_DICT=$1
|
||
|
;;
|
||
|
--word)
|
||
|
shift
|
||
|
GDWORD=$1
|
||
|
;;
|
||
|
--sentence)
|
||
|
shift
|
||
|
GDSEARCH=$1
|
||
|
;;
|
||
|
*)
|
||
|
die "Invalid argument passed."
|
||
|
;;
|
||
|
esac
|
||
|
shift
|
||
|
done
|
||
|
|
||
|
if [[ -n $USER_DICT ]] && ! [[ -f $USER_DICT ]]; then
|
||
|
die "Provided user dictionary doesn't exist or isn't a file."
|
||
|
fi
|
||
|
|
||
|
if [[ -z $GDSEARCH ]] || [[ -z $GDWORD ]]; then
|
||
|
die "Not enough parameters."
|
||
|
fi
|
||
|
|
||
|
local -r input=$(echo "$GDSEARCH" | sanitize_input)
|
||
|
local -r output=$(grep -Fxs -A1 "$input" -- "$TEMP_FILE")
|
||
|
|
||
|
echo '<div class="gd-mecab">'
|
||
|
if [[ -n $output ]]; then
|
||
|
echo "$output" |
|
||
|
tail -1 |
|
||
|
highlight_word "$GDWORD"
|
||
|
else
|
||
|
echo "$input" |
|
||
|
tee -a "$TEMP_FILE" |
|
||
|
mecab_split |
|
||
|
tee -a "$TEMP_FILE" |
|
||
|
highlight_word "$GDWORD"
|
||
|
printf -- '\n\n' >>"$TEMP_FILE"
|
||
|
fi
|
||
|
echo '</div>'
|
||
|
|
||
|
print_css
|
||
|
}
|
||
|
|
||
|
main "$@"
|