Upstream's implementation has been merged a while ago and is the preferred way to set fields, as it is the only one compatible with upstream and is more user-friendly. This commit deletes the legacy glitch-soc FrontMatter functionality in order to clean up the code and make it easier to maintain.master
parent
c4bec9263c
commit
88b593a63f
@ -1,223 +0,0 @@ |
|||||||
# frozen_string_literal: true |
|
||||||
|
|
||||||
require 'singleton' |
|
||||||
|
|
||||||
# See also `app/javascript/features/account/util/bio_metadata.js`. |
|
||||||
|
|
||||||
class FrontmatterHandler |
|
||||||
include Singleton |
|
||||||
|
|
||||||
# CONVENIENCE FUNCTIONS # |
|
||||||
|
|
||||||
def self.unirex(str) |
|
||||||
Regexp.new str, Regexp::MULTILINE |
|
||||||
end |
|
||||||
def self.rexstr(exp) |
|
||||||
'(?:' + exp.source + ')' |
|
||||||
end |
|
||||||
|
|
||||||
# CHARACTER CLASSES # |
|
||||||
|
|
||||||
DOCUMENT_START = /^/ |
|
||||||
DOCUMENT_END = /$/ |
|
||||||
ALLOWED_CHAR = # c-printable` in the YAML 1.2 spec. |
|
||||||
/[\t\n\r\u{20}-\u{7e}\u{85}\u{a0}-\u{d7ff}\u{e000}-\u{fffd}\u{10000}-\u{10ffff}]/u |
|
||||||
WHITE_SPACE = /[ \t]/ |
|
||||||
INDENTATION = / */ |
|
||||||
LINE_BREAK = /\r?\n|\r|<br\s*\/?>/ |
|
||||||
ESCAPE_CHAR = /[0abt\tnvfre "\/\\N_LP]/ |
|
||||||
HEXADECIMAL_CHARS = /[0-9a-fA-F]/ |
|
||||||
INDICATOR = /[-?:,\[\]{}&#*!|>'"%@`]/ |
|
||||||
FLOW_CHAR = /[,\[\]{}]/ |
|
||||||
|
|
||||||
# NEGATED CHARACTER CLASSES # |
|
||||||
|
|
||||||
NOT_WHITE_SPACE = unirex '(?!' + rexstr(WHITE_SPACE) + ').' |
|
||||||
NOT_LINE_BREAK = unirex '(?!' + rexstr(LINE_BREAK) + ').' |
|
||||||
NOT_INDICATOR = unirex '(?!' + rexstr(INDICATOR) + ').' |
|
||||||
NOT_FLOW_CHAR = unirex '(?!' + rexstr(FLOW_CHAR) + ').' |
|
||||||
NOT_ALLOWED_CHAR = unirex '(?!' + rexstr(ALLOWED_CHAR) + ').' |
|
||||||
|
|
||||||
# BASIC CONSTRUCTS # |
|
||||||
|
|
||||||
ANY_WHITE_SPACE = unirex rexstr(WHITE_SPACE) + '*' |
|
||||||
ANY_ALLOWED_CHARS = unirex rexstr(ALLOWED_CHAR) + '*' |
|
||||||
NEW_LINE = unirex( |
|
||||||
rexstr(ANY_WHITE_SPACE) + rexstr(LINE_BREAK) |
|
||||||
) |
|
||||||
SOME_NEW_LINES = unirex( |
|
||||||
'(?:' + rexstr(ANY_WHITE_SPACE) + rexstr(LINE_BREAK) + ')+' |
|
||||||
) |
|
||||||
POSSIBLE_STARTS = unirex( |
|
||||||
rexstr(DOCUMENT_START) + rexstr(/<p[^<>]*>/) + '?' |
|
||||||
) |
|
||||||
POSSIBLE_ENDS = unirex( |
|
||||||
rexstr(SOME_NEW_LINES) + '|' + |
|
||||||
rexstr(DOCUMENT_END) + '|' + |
|
||||||
rexstr(/<\/p>/) |
|
||||||
) |
|
||||||
CHARACTER_ESCAPE = unirex( |
|
||||||
rexstr(/\\/) + |
|
||||||
'(?:' + |
|
||||||
rexstr(ESCAPE_CHAR) + '|' + |
|
||||||
rexstr(/x/) + rexstr(HEXADECIMAL_CHARS) + '{2}' + '|' + |
|
||||||
rexstr(/u/) + rexstr(HEXADECIMAL_CHARS) + '{4}' + '|' + |
|
||||||
rexstr(/U/) + rexstr(HEXADECIMAL_CHARS) + '{8}' + |
|
||||||
')' |
|
||||||
) |
|
||||||
ESCAPED_CHAR = unirex( |
|
||||||
rexstr(/(?!["\\])/) + rexstr(NOT_LINE_BREAK) + '|' + |
|
||||||
rexstr(CHARACTER_ESCAPE) |
|
||||||
) |
|
||||||
ANY_ESCAPED_CHARS = unirex( |
|
||||||
rexstr(ESCAPED_CHAR) + '*' |
|
||||||
) |
|
||||||
ESCAPED_APOS = unirex( |
|
||||||
'(?=' + rexstr(NOT_LINE_BREAK) + ')' + rexstr(/[^']|''/) |
|
||||||
) |
|
||||||
ANY_ESCAPED_APOS = unirex( |
|
||||||
rexstr(ESCAPED_APOS) + '*' |
|
||||||
) |
|
||||||
FIRST_KEY_CHAR = unirex( |
|
||||||
'(?=' + rexstr(NOT_LINE_BREAK) + ')' + |
|
||||||
'(?=' + rexstr(NOT_WHITE_SPACE) + ')' + |
|
||||||
rexstr(NOT_INDICATOR) + '|' + |
|
||||||
rexstr(/[?:-]/) + |
|
||||||
'(?=' + rexstr(NOT_LINE_BREAK) + ')' + |
|
||||||
'(?=' + rexstr(NOT_WHITE_SPACE) + ')' + |
|
||||||
'(?=' + rexstr(NOT_FLOW_CHAR) + ')' |
|
||||||
) |
|
||||||
FIRST_VALUE_CHAR = unirex( |
|
||||||
'(?=' + rexstr(NOT_LINE_BREAK) + ')' + |
|
||||||
'(?=' + rexstr(NOT_WHITE_SPACE) + ')' + |
|
||||||
rexstr(NOT_INDICATOR) + '|' + |
|
||||||
rexstr(/[?:-]/) + |
|
||||||
'(?=' + rexstr(NOT_LINE_BREAK) + ')' + |
|
||||||
'(?=' + rexstr(NOT_WHITE_SPACE) + ')' |
|
||||||
# Flow indicators are allowed in values. |
|
||||||
) |
|
||||||
LATER_KEY_CHAR = unirex( |
|
||||||
rexstr(WHITE_SPACE) + '|' + |
|
||||||
'(?=' + rexstr(NOT_LINE_BREAK) + ')' + |
|
||||||
'(?=' + rexstr(NOT_WHITE_SPACE) + ')' + |
|
||||||
'(?=' + rexstr(NOT_FLOW_CHAR) + ')' + |
|
||||||
rexstr(/[^:#]#?/) + '|' + |
|
||||||
rexstr(/:/) + '(?=' + rexstr(NOT_WHITE_SPACE) + ')' |
|
||||||
) |
|
||||||
LATER_VALUE_CHAR = unirex( |
|
||||||
rexstr(WHITE_SPACE) + '|' + |
|
||||||
'(?=' + rexstr(NOT_LINE_BREAK) + ')' + |
|
||||||
'(?=' + rexstr(NOT_WHITE_SPACE) + ')' + |
|
||||||
# Flow indicators are allowed in values. |
|
||||||
rexstr(/[^:#]#?/) + '|' + |
|
||||||
rexstr(/:/) + '(?=' + rexstr(NOT_WHITE_SPACE) + ')' |
|
||||||
) |
|
||||||
|
|
||||||
# YAML CONSTRUCTS # |
|
||||||
|
|
||||||
YAML_START = unirex( |
|
||||||
rexstr(ANY_WHITE_SPACE) + rexstr(/---/) |
|
||||||
) |
|
||||||
YAML_END = unirex( |
|
||||||
rexstr(ANY_WHITE_SPACE) + rexstr(/(?:---|\.\.\.)/) |
|
||||||
) |
|
||||||
YAML_LOOKAHEAD = unirex( |
|
||||||
'(?=' + |
|
||||||
rexstr(YAML_START) + |
|
||||||
rexstr(ANY_ALLOWED_CHARS) + rexstr(NEW_LINE) + |
|
||||||
rexstr(YAML_END) + rexstr(POSSIBLE_ENDS) + |
|
||||||
')' |
|
||||||
) |
|
||||||
YAML_DOUBLE_QUOTE = unirex( |
|
||||||
rexstr(/"/) + rexstr(ANY_ESCAPED_CHARS) + rexstr(/"/) |
|
||||||
) |
|
||||||
YAML_SINGLE_QUOTE = unirex( |
|
||||||
rexstr(/'/) + rexstr(ANY_ESCAPED_APOS) + rexstr(/'/) |
|
||||||
) |
|
||||||
YAML_SIMPLE_KEY = unirex( |
|
||||||
rexstr(FIRST_KEY_CHAR) + rexstr(LATER_KEY_CHAR) + '*' |
|
||||||
) |
|
||||||
YAML_SIMPLE_VALUE = unirex( |
|
||||||
rexstr(FIRST_VALUE_CHAR) + rexstr(LATER_VALUE_CHAR) + '*' |
|
||||||
) |
|
||||||
YAML_KEY = unirex( |
|
||||||
rexstr(YAML_DOUBLE_QUOTE) + '|' + |
|
||||||
rexstr(YAML_SINGLE_QUOTE) + '|' + |
|
||||||
rexstr(YAML_SIMPLE_KEY) |
|
||||||
) |
|
||||||
YAML_VALUE = unirex( |
|
||||||
rexstr(YAML_DOUBLE_QUOTE) + '|' + |
|
||||||
rexstr(YAML_SINGLE_QUOTE) + '|' + |
|
||||||
rexstr(YAML_SIMPLE_VALUE) |
|
||||||
) |
|
||||||
YAML_SEPARATOR = unirex( |
|
||||||
rexstr(ANY_WHITE_SPACE) + |
|
||||||
':' + rexstr(WHITE_SPACE) + |
|
||||||
rexstr(ANY_WHITE_SPACE) |
|
||||||
) |
|
||||||
YAML_LINE = unirex( |
|
||||||
'(' + rexstr(YAML_KEY) + ')' + |
|
||||||
rexstr(YAML_SEPARATOR) + |
|
||||||
'(' + rexstr(YAML_VALUE) + ')' |
|
||||||
) |
|
||||||
|
|
||||||
# FRONTMATTER REGEX # |
|
||||||
|
|
||||||
YAML_FRONTMATTER = unirex( |
|
||||||
rexstr(POSSIBLE_STARTS) + |
|
||||||
rexstr(YAML_LOOKAHEAD) + |
|
||||||
rexstr(YAML_START) + rexstr(SOME_NEW_LINES) + |
|
||||||
'(?:' + |
|
||||||
'(' + rexstr(INDENTATION) + ')' + |
|
||||||
rexstr(YAML_LINE) + rexstr(SOME_NEW_LINES) + |
|
||||||
'(?:' + |
|
||||||
'\\1' + rexstr(YAML_LINE) + rexstr(SOME_NEW_LINES) + |
|
||||||
'){0,4}' + |
|
||||||
')?' + |
|
||||||
rexstr(YAML_END) + rexstr(POSSIBLE_ENDS) |
|
||||||
) |
|
||||||
|
|
||||||
# SEARCHES # |
|
||||||
|
|
||||||
FIND_YAML_LINES = unirex( |
|
||||||
rexstr(NEW_LINE) + rexstr(INDENTATION) + rexstr(YAML_LINE) |
|
||||||
) |
|
||||||
|
|
||||||
# STRING PROCESSING # |
|
||||||
|
|
||||||
def process_string(str) |
|
||||||
case str[0] |
|
||||||
when '"' |
|
||||||
str[1..-2] |
|
||||||
when "'" |
|
||||||
str[1..-2].gsub(/''/, "'") |
|
||||||
else |
|
||||||
str |
|
||||||
end |
|
||||||
end |
|
||||||
|
|
||||||
# BIO PROCESSING # |
|
||||||
|
|
||||||
def process_bio content |
|
||||||
result = { |
|
||||||
text: content.gsub(/"/, '"').gsub(/'/, "'"), |
|
||||||
metadata: [] |
|
||||||
} |
|
||||||
yaml = YAML_FRONTMATTER.match(result[:text]) |
|
||||||
return result unless yaml |
|
||||||
yaml = yaml[0] |
|
||||||
start = YAML_START =~ result[:text] |
|
||||||
ending = start + yaml.length - (YAML_START =~ yaml) |
|
||||||
result[:text][start..ending - 1] = '' |
|
||||||
metadata = nil |
|
||||||
index = 0 |
|
||||||
while metadata = FIND_YAML_LINES.match(yaml, index) do |
|
||||||
index = metadata.end(0) |
|
||||||
result[:metadata].push [ |
|
||||||
process_string(metadata[1]), process_string(metadata[2]) |
|
||||||
] |
|
||||||
end |
|
||||||
return result |
|
||||||
end |
|
||||||
|
|
||||||
end |
|
Loading…
Reference in new issue