This repository has been archived on 2024-10-30. You can view files and clone it, but cannot push or open issues or pull requests.
swb6-it-sec/Lab04/content/part1/analyse/main.go

129 lines
2.8 KiB
Go
Raw Normal View History

2022-05-30 09:36:08 +02:00
package main
import (
2022-11-14 18:29:26 +01:00
"flag"
2022-05-30 10:07:48 +02:00
"fmt"
"github.com/dariubs/percent"
2022-05-30 11:42:59 +02:00
"gonum.org/v1/plot"
"gonum.org/v1/plot/plotter"
"gonum.org/v1/plot/plotutil"
"gonum.org/v1/plot/vg"
"log"
2022-11-14 18:29:26 +01:00
"os"
2022-05-30 11:02:34 +02:00
"sort"
2022-05-30 09:36:08 +02:00
"strings"
)
2022-05-30 11:02:34 +02:00
type letter struct {
upperCase string
lowerCase string
count int
frequency float64
}
type letterList []letter
func (l letterList) Len() int {
return len(l)
}
2022-11-14 18:29:26 +01:00
func (l letterList) Less(firstIndex, secondIndex int) bool {
return l[firstIndex].frequency > l[secondIndex].frequency
2022-05-30 11:02:34 +02:00
}
2022-11-14 18:29:26 +01:00
func (l letterList) Swap(firstIndex, secondIndex int) {
l[firstIndex], l[secondIndex] = l[secondIndex], l[firstIndex]
2022-05-30 11:02:34 +02:00
}
2022-06-08 16:26:04 +02:00
const lettersInTheAlphabet = 'Z' - 'A' + 1
2022-05-30 11:42:59 +02:00
2022-06-08 16:26:04 +02:00
var letters = make([]letter, lettersInTheAlphabet)
2022-05-30 11:02:34 +02:00
2022-11-14 18:29:26 +01:00
func init() {
2022-06-08 16:26:04 +02:00
for i := 0; i < lettersInTheAlphabet; i++ {
letters[i].upperCase = string(rune('A' + i))
letters[i].lowerCase = string(rune('A' + i + 32))
2022-05-30 11:02:34 +02:00
}
}
2022-11-14 18:29:26 +01:00
func parseArguments() string {
var inputFile string
flag.StringVar(&inputFile, "f", "", "Specify file to analyse.")
flag.Parse()
if inputFile == "" {
log.Print("No flag provided\n\nHelp:\n")
flag.PrintDefaults()
os.Exit(1)
}
return inputFile
}
2022-05-30 11:02:34 +02:00
func readFile(relativePath string) string {
2022-11-14 18:29:26 +01:00
content, err := os.ReadFile(relativePath)
2022-05-30 11:02:34 +02:00
if err != nil {
2022-05-30 11:42:59 +02:00
log.Fatalln(err)
2022-05-30 11:02:34 +02:00
}
return string(content)
}
2022-05-30 10:07:48 +02:00
2022-05-30 11:02:34 +02:00
func countLetters(inputText string) int {
2022-05-30 10:07:48 +02:00
totalCount := 0
2022-06-08 16:26:04 +02:00
for i := 0; i < lettersInTheAlphabet; i++ {
2022-05-30 13:41:45 +02:00
letters[i].count +=
strings.Count(inputText, letters[i].lowerCase) +
strings.Count(inputText, letters[i].upperCase)
totalCount += letters[i].count
2022-05-30 10:07:48 +02:00
}
2022-05-30 11:02:34 +02:00
return totalCount
}
func calculateFrequency(totalCount int) {
2022-06-08 16:26:04 +02:00
for i := 0; i < lettersInTheAlphabet; i++ {
2022-05-30 13:41:45 +02:00
letters[i].frequency = percent.PercentOf(letters[i].count, totalCount)
2022-05-30 10:07:48 +02:00
}
2022-05-30 11:02:34 +02:00
}
func printResult() {
2022-06-08 16:26:04 +02:00
for i := 0; i < lettersInTheAlphabet; i++ {
2022-05-30 13:41:45 +02:00
l := letters[i]
2022-05-30 11:02:34 +02:00
fmt.Printf(
"The letter %s (%s) occurs %d times in the text and the frequencyArray in percent is %0.2f\n",
l.upperCase, l.lowerCase, l.count, l.frequency,
)
2022-05-30 10:07:48 +02:00
}
2022-05-30 09:36:08 +02:00
}
2022-05-30 11:42:59 +02:00
func plotResult() {
var count plotter.Values
2022-06-08 16:26:04 +02:00
for i := 0; i < lettersInTheAlphabet; i++ {
2022-05-30 13:41:45 +02:00
count = append(count, float64(letters[i].count))
2022-05-30 11:42:59 +02:00
}
p := plot.New()
p.Title.Text = "Letter count"
p.X.Label.Text = "letter"
p.Y.Label.Text = "count"
2022-06-08 16:26:04 +02:00
countBars, err := plotter.NewBarChart(count, vg.Points(lettersInTheAlphabet/2))
2022-05-30 11:42:59 +02:00
countBars.Color = plotutil.Color(2)
if err != nil {
log.Fatalln(err)
}
p.Add(countBars)
var xAxisNaming []string
for index := range letters {
xAxisNaming = append(xAxisNaming, letters[index].upperCase)
}
p.NominalX(xAxisNaming...)
2022-11-14 18:29:26 +01:00
if err = p.Save(25*vg.Centimeter, 15*vg.Centimeter, "barChart.png"); err != nil {
2022-05-30 11:42:59 +02:00
log.Fatalln(err)
}
}
2022-05-30 09:36:08 +02:00
func main() {
2022-11-14 18:29:26 +01:00
inputFile := parseArguments()
totalCount := countLetters(readFile(inputFile))
2022-05-30 11:02:34 +02:00
calculateFrequency(totalCount)
2022-05-30 11:42:59 +02:00
plotResult()
2022-05-30 11:02:34 +02:00
sort.Sort(letterList(letters))
printResult()
2022-05-30 10:07:48 +02:00
}