gsl-statique-litterateur/var/lib/gsl/scripts/gsl__post_checkers

574 lines
13 KiB
Plaintext
Raw Normal View History

#!/bin/bash
# file: gsl__post_checkers
# Folder: /var/lib/gsl/scripts
# By echolib
# License: GNU AFFERO GENERAL PUBLIC LICENSE Version 3, 19 November 2007
#----------------------------------------------------------------------
# --------------------------------------------------
# From: gsl__loop_posts | MAIN checkers from modules
# --------------------------------------------------
#----------------------------------------------------------------------
# Run every checker on the current post, in a fixed order.
# Globals read:    gsl_post, gsl_tmp_post,
#                  gsl_marker_link/abbr/file/image/code
# Globals written: gsl_stat_* counters, gsl_count_files, gsl_db_tmp
# Returns: non-zero when the temporary DB file cannot be created or when
#          gsl__check_h1 fails; otherwise the status of the final rm.
gsl__all_checkers() {
  local h1_status

  # Init Stats
  gsl_stat_abbr=0
  gsl_stat_abbrs=0
  gsl_stat_link=0
  gsl_stat_links=0
  gsl_stat_file=0
  gsl_count_files=0
  gsl_stat_image=0
  gsl_stat_fcode=0
  # gsl__check_paragraphs / gsl__check_blockquote assign these only on
  # success, so reset them: a failing post must not reuse the values
  # left behind by a previous post.
  gsl_stat_p=0
  gsl_stat_bq=0

  # Scratch file filled by the file/image/code checkers.
  gsl_db_tmp=$(mktemp) || return

  # Without a "#1" title nothing else is checked; drop the scratch file
  # before leaving so it does not leak.
  gsl__check_h1
  h1_status=$?
  if (( h1_status != 0 )); then
    rm -f -- "$gsl_db_tmp"
    return "$h1_status"
  fi

  gsl__post_content_only
  gsl__get_needed_headers
  gsl__check_type
  gsl__check_headers
  gsl__check_paragraphs "$gsl_tmp_post"
  gsl__check_blockquote "$gsl_tmp_post"

  gsl__do_header check "$gsl_marker_link" "$gsl_post"
  gsl__do_header check "$gsl_marker_abbr" "$gsl_post"
  gsl__do_header check "$gsl_marker_file" "$gsl_post"
  gsl__do_header check "$gsl_marker_image" "$gsl_post"
  gsl__do_header check "$gsl_marker_code" "$gsl_post"

  gsl__stat_words "$gsl_tmp_post"
  gsl__do_strongs_bolds stats "$gsl_tmp_post"
  gsl__do_italics stats "$gsl_tmp_post"
  gsl__do_icode stats "$gsl_tmp_post"

  rm -f -- "$gsl_tmp_post"

  # Clear the progress line.
  printf '\r\033[2K'

  # NOTE(review): presumably consumes "$gsl_db_tmp", hence the removal
  # only afterwards - confirm against gsl__db_set_post_status.
  gsl__db_set_post_status chk
  rm -f -- "$gsl_db_tmp"
}
#----------------------------------------------------------------------
# -------------------------------------------------
# Modules checkers
# -------------------------------------------------
#----------------------------------------------------------------------
#======================================================================
# Check Post for beginning content
#======================================================================
# Find the first line of "$gsl_post" containing "#1".
# Globals read:    gsl_post, gsl_log_e, gsl_log_c_h1
# Globals written: gsl_post_begin (line number, empty when not found),
#                  gsl_checker_err (set to true when not found)
# Returns: 0 when a "#1" line exists, 1 otherwise (the caller relies on
#          this status to stop checking the post).
gsl__check_h1() {
  printf ': Searching for #1...'

  # -m 1 stops at the first match; grep -n prints "LINE:content".
  gsl_post_begin=$(grep -n -m 1 -e '#1' -- "$gsl_post" | cut -d: -f1)

  if [[ -z "$gsl_post_begin" ]]; then
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "$gsl_log_c_h1" \
      "Missing: #1 TITLE" \
      "${PWD}/$gsl_post"
    gsl_checker_err=true
    return 1
  fi
}
#======================================================================
# Check/Set Post Type
#======================================================================
# Accept "page" or "post" as post type; anything else falls back to
# "post", which is then written as a new first line of "$gsl_post".
# Globals read:    gsl_post, gsl_marker_type, gsl_log_i, gsl_log_w
# Globals written: gsl_post_type (forced to "post" on fallback)
gsl__check_type() {
  printf '\r\033[2K: Searching for Post TYPE...'

  case "$gsl_post_type" in
    page|post)
      gsl__logs_print \
        "$gsl_log_i" \
        "Post" \
        "Set as" \
        "$gsl_post_type: $gsl_post" \
        "${PWD}/$gsl_post"
      ;;

    *)
      gsl_post_type="post"
      # GNU sed one-line "i": insert the type header before line 1.
      # The warning is logged only when the insertion succeeded.
      if sed -i -- "1i$gsl_marker_type$gsl_post_type" "$gsl_post"; then
        gsl__logs_print \
          "$gsl_log_w" \
          "Post" \
          "Set as" \
          "Default: $gsl_post_type for $gsl_post" \
          "${PWD}/$gsl_post"
      fi
      # The file content may have changed; called regardless of the sed
      # result. NOTE(review): presumably refreshes the stored checksum.
      gsl__get_sum "$gsl_post"
      ;;
  esac
}
#======================================================================
# Check for paragraphs ( and ) | $1: File
#======================================================================
# Count the lines of file $1 whose first whitespace-separated field is
# the paragraph opener ($gsl_mo_p) and those whose first field is the
# closer ($gsl_mc_p); both counts must be non-zero and equal.
# Globals read:    gsl_mo_p, gsl_mc_p, gsl_post, gsl_log_e, gsl_log_c_p
# Globals written: gsl_post_p_open, gsl_post_p_close,
#                  gsl_stat_p (only when the counts match),
#                  gsl_checker_err (true on missing/mismatched markers)
gsl__check_paragraphs() {
  printf '\r\033[2K: Searching for Paragraphs...'

  gsl_post_p_open=$(
    awk -v op="$gsl_mo_p" '$1 == op { n++ } END { print n + 0 }' "$1"
  )
  gsl_post_p_close=$(
    awk -v cp="$gsl_mc_p" '$1 == cp { n++ } END { print n + 0 }' "$1"
  )

  # No opening marker at all
  if (( gsl_post_p_open == 0 )); then
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "$gsl_log_c_p" \
      "Missing: ( and ) at begining lines" \
      "${PWD}/$gsl_post"
    gsl_checker_err=true
    return
  fi

  # Every opener needs its closer
  if (( gsl_post_p_open != gsl_post_p_close )); then
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "$gsl_log_c_p" \
      "Mismatch: (=$gsl_post_p_open ; )=$gsl_post_p_close" \
      "${PWD}/$gsl_post"
    gsl_checker_err=true
    return
  fi

  gsl_stat_p="$gsl_post_p_open"
}
#======================================================================
# Check for blockquotes: --- | $1: File
#======================================================================
# Count the lines of file $1 whose first whitespace-separated field is
# the blockquote marker ($gsl_mark_blockquote). Markers work in pairs,
# so an odd count is an error.
# Globals read:    gsl_mark_blockquote, gsl_post, gsl_log_e,
#                  gsl_log_c_cite
# Globals written: gsl_post_blockquotes_nbr, gsl_post_blockquotes_nbr_r,
#                  gsl_stat_bq (number of pairs, only when count is even),
#                  gsl_checker_err (true when markers are not paired)
gsl__check_blockquote() {
  printf '\r\033[2K: Searching for BLOCKQUOTEs...'

  gsl_post_blockquotes_nbr=$(
    awk -v bq="$gsl_mark_blockquote" \
      '$1 == bq { n++ } END { print n + 0 }' \
      "$1"
  )
  gsl_post_blockquotes_nbr_r=$(( gsl_post_blockquotes_nbr % 2 ))

  if (( gsl_post_blockquotes_nbr_r != 0 )); then
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "$gsl_log_c_cite" \
      "Mismatch: --- not paired" \
      "${PWD}/$gsl_post"
    gsl_checker_err=true
    return
  fi

  gsl_stat_bq=$(( gsl_post_blockquotes_nbr / 2 ))
}
#======================================================================
# From gsl__do_header: Check Link
#======================================================================
# Validate one link header: its fields, its use in the post content
# (as "_<field 1>") and the reachability of its URL (field 2).
# Globals read:    gsl_post, gsl_post_hf_1, gsl_post_hf_2,
#                  gsl_marker_link, gsl_log_i/w/e, gsl_log_h_link,
#                  gsl_log_c_link, gsl_log_act_link
# Globals written: gsl_count_links, gsl_url_status, gsl_stat_link,
#                  gsl_stat_links, gsl_checker_war, gsl_checker_err
gsl__check_link() {
  # Get & Check Header CONTENT
  gsl__check_header_fields \
    "Post" "$gsl_log_h_link" "$gsl_log_act_link" \
    || return

  printf '\r\033[2K: Searching for Links... %s' "$gsl_post_hf_1"

  # No ALT TEXT ?
  gsl__check_header_field3 "Post" "$gsl_log_h_link" "$gsl_marker_link"

  gsl_count_links=$(
    gsl__get_content_line "_$gsl_post_hf_1" "$gsl_post" | wc -l
  )

  # Header declared but never used in the content: this sets the error
  # flag, so it is logged at error level like the other checkers do.
  if (( gsl_count_links <= 0 )); then
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "$gsl_log_c_link" \
      "Missing: _$gsl_post_hf_1" \
      "${PWD}/$gsl_post"
    gsl_checker_err=true
    return
  fi

  # Check URL (HEAD request, 2 seconds max)
  gsl_url_status=$(
    timeout 2 curl -o /dev/null --silent --head --write-out \
      '%{http_code}' \
      "$gsl_post_hf_2" 2>/dev/null
  )
  # Fall back to 408 only when curl printed nothing (e.g. killed by
  # timeout); appending it to curl's own output would yield "000408".
  [[ -n "$gsl_url_status" ]] || gsl_url_status="408"

  case "$gsl_url_status" in
    # NOTE(review): codes starting with 0 (curl's "000") are treated as
    # Online, as before - confirm this is intended.
    0*|1*|2*|3*)
      gsl__logs_print \
        "$gsl_log_i" \
        "Post" \
        "$gsl_log_h_link" \
        "Online:$gsl_url_status ${gsl_post_hf_2:0:40}..." \
        "${PWD}/$gsl_post"
      ;;
    *)
      gsl__logs_print \
        "$gsl_log_w" \
        "Post" \
        "$gsl_log_h_link" \
        "Offline:$gsl_url_status ${gsl_post_hf_2:0:40}..." \
        "${PWD}/$gsl_post"
      gsl_checker_war=true
      ;;
  esac

  # Stats
  gsl_stat_link=$(( gsl_stat_link + 1 ))
  gsl_stat_links=$(( gsl_stat_links + gsl_count_links ))
}
#======================================================================
# From gsl__do_header: Check ABBR
#======================================================================
# Validate one abbreviation header: its fields, then its use in the
# post content (looked up as field 1).
# Globals read:    gsl_post, gsl_post_hf_1, gsl_log_e, gsl_log_h_abbr,
#                  gsl_log_c_abbr, gsl_log_act_abbr
# Globals written: gsl_count_abbrs, gsl_stat_abbr, gsl_stat_abbrs,
#                  gsl_checker_err
gsl__check_abbr() {
  gsl__check_header_fields \
    "Post" "$gsl_log_h_abbr" "$gsl_log_act_abbr" \
    || return

  printf '\r\033[2K: Searching for ABBRs... %s' "$gsl_post_hf_1"

  gsl_count_abbrs=$(
    gsl__get_content_line "$gsl_post_hf_1" "$gsl_post" | wc -l
  )

  if (( gsl_count_abbrs > 0 )); then
    gsl_stat_abbr=$(( gsl_stat_abbr + 1 ))
    gsl_stat_abbrs=$(( gsl_stat_abbrs + gsl_count_abbrs ))
  else
    # Missing CONTENT: report the same field that was searched for.
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "$gsl_log_c_abbr" \
      "Missing: $gsl_post_hf_1" \
      "${PWD}/$gsl_post"
    gsl_checker_err=true
  fi
}
#======================================================================
# From gsl__do_header: Check Files
#======================================================================
# Validate one file header: its fields, the presence of the file
# (field 2) in "$gsl_dir_domain_files" and its use in the post content
# (as "__<field 1>"). An existing file is appended to "$gsl_db_tmp" as
# "File:<path>:<cksum>".
# Globals read:    gsl_post, gsl_post_hf_1, gsl_post_hf_2,
#                  gsl_dir_domain_files, gsl_db_tmp, gsl_marker_file,
#                  gsl_log_e, gsl_log_h_file, gsl_log_c_file,
#                  gsl_log_act_file
# Globals written: gsl_file_csum, gsl_count_files, gsl_stat_file,
#                  gsl_checker_err
gsl__check_file() {
  gsl__check_header_fields \
    "Post" "$gsl_log_h_file" "$gsl_log_act_file" \
    || return

  printf '\r\033[2K: Searching for Content Files... %s' "$gsl_post_hf_1"

  gsl__check_header_field3 "Post" "$gsl_log_h_file" "$gsl_marker_file"

  # File exists in folder
  if [[ -f "$gsl_dir_domain_files/$gsl_post_hf_2" ]]; then
    # Register file to DB with hash; the recorded path is the one that
    # was actually checked and checksummed (the files folder).
    gsl_file_csum=$(
      cksum "$gsl_dir_domain_files/$gsl_post_hf_2" | awk '{print $1}'
    )
    printf '%s\n' \
      "File:$gsl_dir_domain_files/$gsl_post_hf_2:$gsl_file_csum" \
      >> "$gsl_db_tmp"
  else
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "Header $gsl_marker_file" \
      "Not found: $gsl_post_hf_2" \
      "$gsl_dir_domain_files/$gsl_post_hf_2"
    gsl_checker_err=true
  fi

  # Exists in Content
  gsl_count_files=$(
    gsl__get_content_line "__$gsl_post_hf_1" "$gsl_post" | wc -l
  )

  if (( gsl_count_files > 0 )); then
    gsl_stat_file=$(( gsl_stat_file + 1 ))
  else
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "$gsl_log_c_file" \
      "Missing: __$gsl_post_hf_1" \
      "${PWD}/$gsl_post"
    gsl_checker_err=true
  fi
}
#======================================================================
# From gsl__do_header: Check Images
#======================================================================
# Validate one image header: its fields (including field 3), the
# presence of the image (field 2) in "$gsl_dir_domain_images" and its
# use in the post content (as "_image:<field 1>"). An existing image is
# appended to "$gsl_db_tmp" as "Image:<path>:<cksum>".
# Globals read:    gsl_post, gsl_post_hf_1, gsl_post_hf_2,
#                  gsl_dir_domain_images, gsl_db_tmp, gsl_marker_image,
#                  gsl_log_e, gsl_log_h_image, gsl_log_c_image,
#                  gsl_log_act_image
# Globals written: gsl_file_csum, gsl_count_images, gsl_stat_image,
#                  gsl_checker_err
gsl__check_image() {
  gsl__check_header_fields \
    "Post" "$gsl_log_h_image" "$gsl_log_act_image" \
    || return

  printf '\r\033[2K: Searching for Images... %s' "$gsl_post_hf_1"

  # Unlike the link/file checkers, a failed field-3 check stops here.
  gsl__check_header_field3 "Post" "$gsl_log_h_image" "$gsl_marker_image" \
    || return

  # File exists in folder
  if [[ -f "$gsl_dir_domain_images/$gsl_post_hf_2" ]]; then
    # Register file to DB with hash
    gsl_file_csum=$(
      cksum "$gsl_dir_domain_images/$gsl_post_hf_2" | awk '{print $1}'
    )
    printf '%s\n' \
      "Image:$gsl_dir_domain_images/$gsl_post_hf_2:$gsl_file_csum" \
      >> "$gsl_db_tmp"
  else
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "$gsl_log_h_image" \
      "Not found: $gsl_post_hf_2" \
      "$gsl_dir_domain_images/$gsl_post_hf_2"
    gsl_checker_err=true
  fi

  # Exists in Content
  gsl_count_images=$(
    gsl__get_content_line "_image:$gsl_post_hf_1" "$gsl_post" | wc -l
  )

  if (( gsl_count_images > 0 )); then
    gsl_stat_image=$(( gsl_stat_image + 1 ))
  else
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "$gsl_log_c_image" \
      "Missing: _image:$gsl_post_hf_1" \
      "${PWD}/$gsl_post"
    gsl_checker_err=true
  fi
}
#======================================================================
# From gsl__do_header: Check File Codes
#======================================================================
# Validate one code-file header: its fields, the presence of the file
# (field 2) in "$gsl_dir_domain_files" and its use in the post content
# (as "_code:<field 1>"). An existing file is appended to "$gsl_db_tmp"
# as "FCode:<path>:<cksum>".
# Globals read:    gsl_post, gsl_post_hf_1, gsl_post_hf_2,
#                  gsl_dir_domain_files, gsl_db_tmp, gsl_marker_code,
#                  gsl_log_e, gsl_log_h_code, gsl_log_c_code,
#                  gsl_log_act_code
# Globals written: gsl_file_csum, gsl_count_fcodes, gsl_stat_fcode,
#                  gsl_checker_err
gsl__check_fcode() {
  gsl__check_header_fields \
    "Post" "$gsl_log_h_code" "$gsl_log_act_code" \
    || return

  printf '\r\033[2K: Searching for File Codes... %s' "$gsl_post_hf_1"

  # Result deliberately not used to stop, as the original code did not
  # (its trailing backslash only swallowed the following comment line).
  gsl__check_header_field3 "Post" "$gsl_log_h_code" "$gsl_marker_code"

  # File exists in folder
  if [[ -f "$gsl_dir_domain_files/$gsl_post_hf_2" ]]; then
    # Register file to DB with hash, under the folder it was found in.
    gsl_file_csum=$(
      cksum "$gsl_dir_domain_files/$gsl_post_hf_2" | awk '{print $1}'
    )
    printf '%s\n' \
      "FCode:$gsl_dir_domain_files/$gsl_post_hf_2:$gsl_file_csum" \
      >> "$gsl_db_tmp"
  else
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "$gsl_log_h_code" \
      "Not found: $gsl_post_hf_2" \
      "$gsl_dir_domain_files/$gsl_post_hf_2"
    gsl_checker_err=true
  fi

  # Exists in Content
  gsl_count_fcodes=$(
    gsl__get_content_line "_code:$gsl_post_hf_1" "$gsl_post" | wc -l
  )

  if (( gsl_count_fcodes > 0 )); then
    gsl_stat_fcode=$(( gsl_stat_fcode + 1 ))
  else
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "$gsl_log_c_code" \
      "Missing: _code:$gsl_post_hf_1" \
      "${PWD}/$gsl_post"
    gsl_checker_err=true
  fi
}
#======================================================================
# Stat: Count words | $1: File
#======================================================================
# Count the words of file $1, minus two per counted paragraph
# (gsl_stat_p), i.e. one opening and one closing marker each.
# Globals read:    gsl_stat_p (treated as 0 when unset or empty)
# Globals written: gsl_stat_words
gsl__stat_words() {
  printf '\r\033[2K: Counting Words...'

  gsl_stat_words=$(wc -w < "$1")
  # ${gsl_stat_p:-0}: the paragraph checker leaves gsl_stat_p untouched
  # when it fails; an empty value would be an arithmetic syntax error.
  gsl_stat_words=$(( gsl_stat_words - 2 * ${gsl_stat_p:-0} ))
}
#======================================================================
# Check Post for MISSING & VALID Content HEADERS
#======================================================================
# First pass: hand every needed header (value, marker, example) to
# gsl__check_needed_headers. Second pass: validate author, date and
# slug, each skipped when its first-pass flag was raised.
# NOTE(review): gsl__check_needed_headers is assumed to return 0 when
# it reported a problem (that is when the *_err flags are raised here)
# - confirm against its definition.
# Globals read:    gsl_post, gsl_header_*, gsl_marker_*,
#                  gsl_file_auth_ndd, gsl_find_domain, gsl_test_date,
#                  gsl_log_e, gsl_log_w
# Globals written: gsl_slug_err, gsl_author_err, gsl_date_err,
#                  gsl_header_slug, gsl_header_slug_test,
#                  gsl_new_header_slug, gsl_checker_err, gsl_checker_war
gsl__check_headers() {
  # Flags are only ever raised below; clear them first so a problem in
  # a previous post cannot disable the validation of this one.
  gsl_slug_err=
  gsl_author_err=
  gsl_date_err=

  printf '\r\033[2K: Searching HEADERS...'

  #--------------------------------
  # Check if Missing NEEDED HEADERS
  #--------------------------------
  # Title
  printf '\r\033[2K: Searching HEADERS... %s' "$gsl_header_title"
  gsl__check_needed_headers \
    "$gsl_header_title" \
    "$gsl_marker_title" \
    "POST TITLE"

  # Slug
  printf '\r\033[2K: Searching HEADERS... %s' "$gsl_header_slug"
  if gsl__check_needed_headers \
    "$gsl_header_slug" \
    "$gsl_marker_slug" \
    "POST-TITLE"; then
    gsl_slug_err=true
  fi

  # Author
  printf '\r\033[2K: Searching HEADERS... %s' "$gsl_header_author"
  if gsl__check_needed_headers \
    "$gsl_header_author" \
    "$gsl_marker_author" \
    "REGISTRED NAME"; then
    gsl_author_err=true
  fi

  # Date
  printf '\r\033[2K: Searching HEADERS... %s' "$gsl_header_date"
  if gsl__check_needed_headers \
    "$gsl_header_date" \
    "$gsl_marker_date" \
    "YYYY-MM-DD"; then
    gsl_date_err=true
  fi

  # Description
  printf '\r\033[2K: Searching HEADERS... %s...' "${gsl_header_info:0:40}"
  gsl__check_needed_headers \
    "$gsl_header_info" \
    "$gsl_marker_info" \
    "DESCRIPTION"

  # Tags
  printf '\r\033[2K: Searching HEADERS... %s...' "${gsl_header_tags:0:40}"
  gsl__check_needed_headers \
    "$gsl_header_tags" \
    "$gsl_marker_tags" \
    "TAG1,OTHER TAG2,TAG3"

  #--------------------------------
  # Check for VALID Content HEADERS
  #--------------------------------
  # Author registered: literal (-F) lookup, so characters such as "."
  # in a name are not interpreted as a regular expression.
  if [[ -z "$gsl_author_err" ]] \
    && ! grep -qF -- "$gsl_header_author" "$gsl_file_auth_ndd"; then
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "Header $gsl_marker_author" \
      "$gsl_header_author not registred for domain $gsl_find_domain" \
      "${PWD}/$gsl_post"
    gsl_checker_err=true
  fi

  # Date Format YYYY-MM-DD ($gsl_test_date is used as a regex)
  if [[ -z "$gsl_date_err" ]] \
    && ! [[ "$gsl_header_date" =~ $gsl_test_date ]]; then
    gsl__logs_print \
      "$gsl_log_e" \
      "Post" \
      "Header $gsl_marker_date" \
      "$gsl_header_date not YYYY-MM-DD" \
      "${PWD}/$gsl_post"
    gsl_checker_err=true
  fi

  # Slug format title-post: spaces become dashes, and the post file is
  # rewritten accordingly.
  if [[ -z "$gsl_slug_err" ]]; then
    gsl_header_slug_test=${gsl_header_slug// /-}

    if [[ "$gsl_header_slug" != "$gsl_header_slug_test" ]]; then
      gsl_new_header_slug="$gsl_marker_slug$gsl_header_slug_test"

      # NOTE(review): marker and slug are interpolated into the sed
      # expression unescaped; a "|" or regex character in them would
      # alter the substitution.
      if sed -i -- \
        "s|$gsl_marker_slug$gsl_header_slug|$gsl_new_header_slug|" \
        "$gsl_post"; then
        gsl__logs_print \
          "$gsl_log_w" \
          "Post" \
          "Header $gsl_marker_slug" \
          "Changed: $gsl_header_slug_test" \
          "${PWD}/$gsl_post"
      fi

      # Done regardless of the sed result, as before.
      gsl__get_sum "$gsl_post"
      gsl_header_slug=$gsl_header_slug_test
      gsl_checker_war=true
    fi
  fi
}