swatson
/
git-site-gen


			
				
					
						
						
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129
							package Gsg::MdParse;
use strict;
use warnings;
use Log::Log4perl qw(:easy);
use Exporter qw(import);
our @EXPORT_OK = qw(render_readme);

sub link_line($) {

	my $line = shift;
	if ( $line =~ m/(<(http.*)>)/ ) {
		my $markup_link = $1;
		my $link = $2;
		my $link_replace = "<a href=\"$link\">$link</a>";
		$line =~ s/\Q$1\E/$link_replace/g;
		return $line;
	}

	return $line;

}

sub strike_line($) {

	my $line = shift;
	#if ( $line =~ m/~~(.*)~~/ ) {
	if ( $line =~ m/^(.*)~~(.*)~~(.*)/ ) {
		$line = "$1<s>$2</s>$3";
		return $line;
	}

	return $line;

}

# README content is passed in as a var, sub returned an HTML version of the parsed markdown
sub render_readme($$) {

	my $readme_content = shift;
	my $logger = shift;

	my $html_readme;
	# Might be a better way to do this? TODO
	open my $fh, '>>', \$html_readme or die "Can't open variable: $!";

	# Main parsing logic, doing it line by line
	# I have some ideas on how to make this more robust/efficient,
	# but starting with below for POC
	# TODO:
	# Headers parsing can be one concise subroutine
	# Started building a suite of simple subs to handle everything else,
	# each line should be run through the 'sub suite' to handle all parsing
	my @readme_lines = split("\n", $readme_content);
	my $inside_code = 0;
	foreach my $line ( @readme_lines ) {
		# HEADERS
		if ( $line =~ m/^#{1}(?!#)(.*)#$|^#{1}(?!#)(.*)$/ && $inside_code == 0 ) {
			my $parsed_line;
			if ( ! defined $1 || $1 eq "" ) {
				$parsed_line = "<h1>$2</h1>";
			} else {
				$parsed_line = "<h1>$1</h1>";
			}
			print $fh "$parsed_line";
		} elsif ( $line =~ m/^#{2}(?!#)(.*)#{2}$|^#{2}(?!#)(.*)$/ && $inside_code == 0) {
			my $parsed_line;
			if ( ! defined $1 || $1 eq "" ) {
				$parsed_line = "<h2>$2</h2>";
			} else {
				$parsed_line = "<h2>$1</h2>";
			}
			print $fh "$parsed_line";
		} elsif ( $line =~ m/^#{3}(?!#)(.*)#{3}$|^#{3}(?!#)(.*)$/ && $inside_code == 0) {
			my $parsed_line;
			if ( ! defined $1 || $1 eq "" ) {
				$parsed_line = "<h3>$2</h3>";
			} else {
				$parsed_line = "<h3>$1</h3>";
			}
			print $fh "$parsed_line";
		} elsif ( $line =~ m/^#{4}(?!#)(.*)#{4}$|^#{4}(?!#)(.*)$/ && $inside_code == 0) {
			my $parsed_line;
			if ( ! defined $1 || $1 eq "" ) {
				$parsed_line = "<h4>$2</h4>";
			} else {
				$parsed_line = "<h4>$1</h4>";
			}
			print $fh "$parsed_line";
		} elsif ( $line =~ m/^#{5}(?!#)(.*)#{5}$|^#{5}(?!#)(.*)$/ && $inside_code == 0) {
			my $parsed_line;
			if ( ! defined $1 || $1 eq "" ) {
				$parsed_line = "<h5>$2</h5>";
			} else {
				$parsed_line = "<h5>$1</h5>";
			}
			print $fh "$parsed_line";
		} elsif ( $line =~ m/^\*(.*)/ && $inside_code == 0) {
			$line = strike_line($1);
			$line = link_line($line);
			my $parsed_line = "<ul><li>$line</li></ul>";
			print $fh "$parsed_line";
		} elsif ( $line =~ m/^```$/ ) {
			if ( $inside_code == 0 ) {
				$inside_code = 1;
				print $fh "<br>";
			} elsif ( $inside_code == 1 ) {
				$inside_code = 0;
			}
		} elsif ( $inside_code == 1 ) { 
			print $fh "<code>$line</code><br>";
		} elsif ( $line =~ m/(http.*)/ ) {
			$line = link_line($line);
			print $fh "$line<br>";
		} elsif ( $line =~ m/^~~(.*)~~/ ) {
			$line = strike_line($line);
			print $fh "$line<br>";
		}
		else {
			print $fh "$line<br>";
		}
	}

	print $fh "<br>";
	close $fh;
	$logger->info("Parsed README");
	return $html_readme;

}
1;