Skip to content
Snippets Groups Projects
html_md.sh 1.65 KiB
Newer Older
  • Learn to ignore specific revisions
  • Lukáš Krupčík's avatar
    Lukáš Krupčík committed
    #!/bin/bash
    
    Lukáš Krupčík's avatar
    Lukáš Krupčík committed
    
    
    Lukáš Krupčík's avatar
    Lukáš Krupčík committed
    ### DOWNLOAD AND CONVERT DOCUMENTATION
    # author: kru0052
    
    Lukáš Krupčík's avatar
    Lukáš Krupčík committed
    # version: 1.00 
    
    Lukáš Krupčík's avatar
    Lukáš Krupčík committed
    ###
    
    Lukáš Krupčík's avatar
    Lukáš Krupčík committed
    
    
    Lukáš Krupčík's avatar
    Lukáš Krupčík committed
    #######################################
    # Mirror https://docs-old.it4i.cz into ./docs-old.it4i.cz with wget,
    # replacing any previous mirror in the current directory.
    # Arguments: none
    # Outputs:   whatever wget prints
    # Returns:   wget's exit status
    #######################################
    download_docs() {
    	# Both lists are passed to wget as single comma-separated words. They are
    	# kept in quoted strings because the reject list contains wildcard
    	# patterns (*js, *xml, @@*) that wget itself must interpret; unquoted they
    	# would be subject to the shell's pathname expansion first.
    	local exclude_dirs='portal_css,portal_javascripts,++resource++jquery-ui-themes,anselm-cluster-documentation/icon.jpg'
    	local reject_list='favicon.ico,pdf.png,logo.png,background.png,application.png,search_icon.png,png.png,sh.png,touch_icon.png,anselm-cluster-documentation/icon.jpg,*js,robots.txt,*xml,RSS,download_icon.png,@@*,anselm-cluster-documentation/icon.jpg.1'

    	# start from a clean mirror
    	rm -rf docs-old.it4i.cz

    	wget -X "$exclude_dirs" -R "$reject_list" \
    		--mirror --convert-links --adjust-extension --page-requisites \
    		--no-parent https://docs-old.it4i.cz
    }

    if [ "$1" = "-w" ]; then
    	# download html pages
    	download_docs
    fi
    #######################################
    # Print the 1-based number of the first line in a file that matches a
    # pattern; print nothing when no line matches.
    # Arguments: $1 - grep basic regular expression
    #            $2 - file to search
    #######################################
    first_match_line() {
    	grep -n -m1 -- "$1" "$2" | cut -f1 -d:
    }

    #######################################
    # Convert one HTML page to Markdown, writing <page-without-extension>.md
    # next to it. Only the content region is converted: from the first line
    # containing '<h1' up to two lines before the first line containing
    # '<!-- <div tal:content='.
    # Arguments: $1 - path of the HTML page
    # Outputs:   progress messages on stdout, skip notices on stderr
    # Returns:   0 on success, 1 when the page has no content region,
    #            otherwise pandoc's exit status
    #######################################
    convert_page() {
    	local page=$1
    	local target="${page%.*}.md"
    	local first marker last tmp status

    	# filtering html files
    	printf "\t\tFiltering html files...\n"
    	first=$(first_match_line '<h1' "$page")
    	marker=$(first_match_line '<!-- <div tal:content=' "$page")

    	if [ -z "$first" ] || [ -z "$marker" ]; then
    		printf '\t\tskipped (content markers not found)\n' >&2
    		# A page without content must not leave a Markdown file behind.
    		rm -f -- "$target"
    		return 1
    	fi

    	last=$((marker-2))
    	if [ "$last" -lt "$first" ]; then
    		printf '\t\tskipped (empty content region)\n' >&2
    		rm -f -- "$target"
    		return 1
    	fi

    	# The scratch file lives outside the scanned tree so it can never be
    	# mistaken for a page.
    	tmp=$(mktemp) || return 1
    	sed -n "${first},${last}p;${last}q" "$page" > "$tmp"

    	# converted .html to .md
    	printf "\t\t.html => .md\n"
    	pandoc -f html -t markdown+pipe_tables-grid_tables "$tmp" -o "$target"
    	status=$?

    	rm -f -- "$tmp"
    	return "$status"
    }

    if [ "$1" = "-c" ]; then
    	# erasing the previous transfer
    	if [ -d ./docs.it4i ]; then
    		rm -rf ./docs.it4i
    	fi
    	if [ -d ./info ]; then
    		rm -rf ./info
    	fi

    	# Collect the pages before converting anything, so the progress total
    	# is computed from exactly the files that get processed.
    	pages=()
    	while IFS= read -r -d '' page; do
    		pages+=("$page")
    	done < <(find . -name "*.ht*" -type f -print0)

    	# counter for html and md files
    	counter=1
    	count=${#pages[@]}

    	for page in "${pages[@]}"; do
    		printf '%s(%s/%s)%s%s%s\n' \
    			"$(tput setaf 12)" "$counter" "$count" \
    			"$(tput setaf 11)" "$page" "$(tput sgr0)"
    		counter=$((counter+1))
    		convert_page "$page"
    	done

    	# delete empty files (any regular file smaller than 10 bytes)
    	find . -type f -size -10c -print0 |
    	while IFS= read -r -d '' small; do
    		rm -- "$small" &&
    			printf '%s%s deleted%s\n' "$(tput setaf 9)" "$small" "$(tput sgr0)"
    	done
    fi