summary refs log tree commit diff
diff options
context:
space:
mode:
author haturatu <taro@eyes4you.org> 2024-10-09 01:36:19 +0900
committer haturatu <taro@eyes4you.org> 2024-10-09 01:36:19 +0900
commit 031b8014901bd101d92af148a841e9b9c8fb59f5 (patch)
tree e284928681323b7bebf08f34bb15db8a11a20f5c
parent 736e6f490c6a9555141188c78c6aa48782d3b5b6 (diff)
fi
-rwxr-xr-x geturl.rb 4
-rwxr-xr-x md.rb 4
2 files changed, 4 insertions, 4 deletions
diff --git a/geturl.rb b/geturl.rb
index 804ed91..c5422c3 100755
--- a/geturl.rb
+++ b/geturl.rb
@@ -7,7 +7,7 @@ require 'nokogiri'
require 'charlock_holmes'
require 'unicode_utils'
-$FILE_PATH = './ok'
+$FILE_PATH = '/Your/URLs/list/file'
$RESULT_FILE = 'Result'
$OTHER_ERROR_FILE = 'Other'
$CONCURRENCY = 10
@@ -17,7 +17,7 @@ def is_garbled?(text)
end
def clean_title(title)
- title = title.chars.reject { |ch| UnicodeUtils.general_category(ch).start_with?('C') && !['(', ')', '[', ']', '{', '}', '【', '】', '「', '」', '(' ,')' ].include?(ch) }.join
+ title = title.chars.reject { |ch| UnicodeUtils.general_category(ch).start_with?('C') && !['(', ')', '[', ']', '{', '}', '【', '】', '【', '】', '「', '」', '(' ,')' ].include?(ch) }.join
title = UnicodeUtils.nfkc(title)
title = title.chars.select(&:valid_encoding?).join
title.strip
diff --git a/md.rb b/md.rb
index 1a8da2b..24c2eb4 100755
--- a/md.rb
+++ b/md.rb
@@ -3,7 +3,7 @@
def convert_to_markdown(input_file, output_file)
content = File.read(input_file, encoding: 'utf-8')
- pairs = content.scan(/URL: (.*?)\nTitle: (.*?)\n/m)
+ pairs = content.scan(/URL: (.*?)\nタイトル: (.*?)\n/m)
File.open(output_file, 'w', encoding: 'utf-8') do |f|
pairs.each do |url, title|
@@ -14,7 +14,7 @@ def convert_to_markdown(input_file, output_file)
title = url.split('/')[-1] if title.strip.empty?
# 特殊文字をエスケープ
- title = title.gsub('[', '\\[').gsub(']', '\\]')
+ title = title.gsub(/[\[\]\(\)\{\}]/) { |m| "\\#{m}" }
# md形式のリンクを作成
markdown_link = "[#{title}](#{url})\n\n"