From fe427c85522870ba6c67e21bae3eeda03bfaabef Mon Sep 17 00:00:00 2001 From: Findus23 Date: Sun, 8 Feb 2015 12:13:45 +0100 Subject: [PATCH] Erster Commit --- .gitignore | 5 +++++ README.md | 1 + descr.sh | 28 ++++++++++++++++++++++++++++ descr_gen.sh | 48 ++++++++++++++++++++++++++++++++++++++++++++++++ ikeagen.py | 45 +++++++++++++++++++++++++++++++++++++++++++++ liste.sh | 23 +++++++++++++++++++++++ tex.sh | 16 ++++++++++++++++ 7 files changed, 166 insertions(+) create mode 100644 .gitignore create mode 100644 README.md create mode 100755 descr.sh create mode 100755 descr_gen.sh create mode 100755 ikeagen.py create mode 100755 liste.sh create mode 100755 tex.sh diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..0581559 --- /dev/null +++ b/.gitignore @@ -0,0 +1,5 @@ +*.pdf +*.bak +*.tmp +tmp +*.txt diff --git a/README.md b/README.md new file mode 100644 index 0000000..b224e16 --- /dev/null +++ b/README.md @@ -0,0 +1 @@ +# nonsense diff --git a/descr.sh b/descr.sh new file mode 100755 index 0000000..9b1502f --- /dev/null +++ b/descr.sh @@ -0,0 +1,28 @@ +#!/bin/bash +rm nomen.txt +rm adj.txt +grep -E -o '(\w|\.|\-)+' descr.txt | sort | uniq > descr_words.txt + +while read line; do + if [ $(echo $line | cut -c 1) == "-" ] + then + echo $line >> suf.txt + echo "Suffix" + elif [ $(echo $line | rev | cut -c 1) == "-" ] + then + echo $line >> präf.txt + echo "Präfix" + elif echo $line | grep [[:upper:]] >/dev/null + then + if echo $line | grep [[:lower:]] >/dev/null + then #Groß und Klein-> Nomen + echo $line >>nomen.txt + echo "Nomen" + fi # nur Groß -> Ikeaname -> verwerfen + elif echo $line | egrep "([[:lower:]]){3,}" >/dev/null + then # keine Großbuchstaben, aber Kleinbuchstaben -> kein Nomen + echo $line >>adj.txt + echo "kein Nomen" + #weder Großbuchstaben noch Kleinbuchstaben -> Zahl -> verwerfen + fi +done 3: + print("".join(wort)) + textnr +=1 diff --git a/liste.sh b/liste.sh new file mode 100755 index 0000000..fc09365 --- /dev/null +++ 
b/liste.sh
@@ -0,0 +1,33 @@
+#!/bin/bash
+# Scrape the IKEA Austria A-Z product index (pages 0..25) and split each
+# product link text into its upper-case product name and the description
+# that follows it. Results: ikeaname.txt and descr.txt, sorted and unique.
+
+# Globbing off: the unquoted expansions below are meant to word-split only.
+set -f
+
+# -f because neither list exists on the first run.
+rm -f ikeaname.txt descr.txt
+
+for i in {0..25}
+do
+  # A failed download leaves nothing to parse for this page.
+  wget -O download.tmp "http://www.ikea.com/at/de/catalog/productsaz/$i/" || continue
+  grep "productsAzLink" download.tmp > lines.tmp
+  while IFS= read -r line; do
+    # Text content of the link element on this line.
+    name=$(printf '%s\n' "$line" | xmllint --xpath 'string(//a)' -)
+    # Runs of two or more capitals (plus trailing blanks) form the product name.
+    ikeaname=$(printf '%s\n' "$name" | grep -E -o "((([A-Z])+){2,} *)+")
+    # Quoted so the name is stripped as a literal prefix, not as a pattern.
+    descr=${name#"$ikeaname"}
+    # Unquoted on purpose: collapses line breaks and surplus blanks.
+    echo $ikeaname >> ikeaname.txt
+    echo $descr >> descr.txt
+  done < lines.tmp
+done
+sort -u ikeaname.txt > ikeaname.txt.tmp
+sort -u descr.txt > descr.txt.tmp
+mv ikeaname.txt.tmp ikeaname.txt
+mv descr.txt.tmp descr.txt
+
diff --git a/tex.sh b/tex.sh
new file mode 100755
index 0000000..982b809
--- /dev/null
+++ b/tex.sh
@@ -0,0 +1,28 @@
+#!/bin/bash
+# Typeset the output of descr_gen.sh as a LaTeX table and build IKEA.pdf.
+# Usage: ./tex.sh ARG   (ARG is handed to descr_gen.sh as its first argument)
+
+# Quoted so an empty or multi-word argument stays a single first argument.
+inhalt=$(./descr_gen.sh "$1" tex-export)
+# Show the generated table body with its line breaks intact.
+printf '%s\n' "$inhalt"
+# Here-document: backslashes of the TeX commands are written out literally.
+cat > IKEA.tex <<EOF
+\documentclass[14pt,a4paper]{article}
+\usepackage[utf8]{inputenc}
+\usepackage[ngerman]{babel}
+\usepackage[T1]{fontenc}
+\author{Lukas Winkler}
+\begin{document}
+
+\begin{tabular}{rl}
+$inhalt
+\end{tabular}
+\end{document}
+EOF
+# Keep the .tex and .log for diagnosis when the build fails.
+if ! pdflatex IKEA.tex; then
+  echo "pdflatex failed, see IKEA.log" >&2
+  exit 1
+fi
+rm -f IKEA.tex IKEA.log IKEA.aux