-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy path03_preprocess_data.go
90 lines (72 loc) · 1.53 KB
/
03_preprocess_data.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
package main
import (
"encoding/csv"
"log"
"os"
"path/filepath"
"strconv"
"strings"
)
// Locations of the raw input CSV and the cleaned output CSV. Both paths are
// built under the directory named by the MLGO environment variable, which is
// read once when the package-level variables are initialized.
var (
	// fileName is the base name of the raw CSV opened by main.
	fileName = "loan_data.csv"
	// saveName is the base name of the cleaned CSV created by main.
	saveName = "clean_loan_data.csv"

	// filePath is the full path of the input file: $MLGO/storage/data/<fileName>.
	filePath = filepath.Join(os.Getenv("MLGO"), "storage", "data", fileName)
	// savePath is the full path of the output file: $MLGO/storage/data/<saveName>.
	savePath = filepath.Join(os.Getenv("MLGO"), "storage", "data", saveName)
)
// Bounds used to min-max scale the parsed score:
//
//	scaled = (score - scoreMin) / (scoreMax - scoreMin)
const (
	// scoreMin is the score that maps to 0 after scaling.
	scoreMin = 640.0
	// scoreMax is the score that maps to 1 after scaling.
	scoreMax = 830.0
)
// main converts the raw loan CSV at filePath into the cleaned CSV at savePath.
//
// The input must contain exactly two fields per record. The first record is
// treated as a header and is replaced by the fields "FICO_score" and "class";
// every following record is converted by cleanRecord. Any I/O or parse error
// terminates the program through the log package.
func main() {
	in, err := os.Open(filePath)
	if err != nil {
		log.Fatal(err)
	}

	reader := csv.NewReader(in)
	reader.FieldsPerRecord = 2
	rawData, err := reader.ReadAll()
	// ReadAll has already buffered everything we need, so release the handle
	// now instead of deferring: log.Fatal exits without running deferred
	// calls. A close error on a read-only file cannot lose data, so it is
	// deliberately ignored.
	_ = in.Close()
	if err != nil {
		log.Fatal(err)
	}

	out, err := os.Create(savePath)
	if err != nil {
		log.Fatal(err)
	}

	w := csv.NewWriter(out)
	for idx, record := range rawData {
		// The first record is the header; it is replaced, not converted.
		outRecord := []string{"FICO_score", "class"}
		if idx > 0 {
			if outRecord, err = cleanRecord(record); err != nil {
				// Records are counted from 1, header included.
				log.Fatalf("record %d: %v", idx+1, err)
			}
		}
		if err := w.Write(outRecord); err != nil {
			log.Fatal(err)
		}
	}

	// Push the records still buffered inside the csv.Writer to the output file.
	w.Flush()
	if err := w.Error(); err != nil {
		log.Fatal(err)
	}
	// Close explicitly so that a failed close of the freshly written file is
	// reported instead of being silently dropped by a deferred call.
	if err := out.Close(); err != nil {
		log.Fatal(err)
	}
}

// cleanRecord converts one raw data record into the two output fields.
//
// record must have at least two fields (main guarantees this through
// reader.FieldsPerRecord). The portion of record[0] before the first "-" is
// parsed as a float and min-max scaled with scoreMin and scoreMax, formatted
// with four decimals. record[1] is parsed as a float after removing a trailing
// "%"; the class field is "1.0" when that value is at most 12.0 and "0.0"
// otherwise. A parse failure of either field is returned as the error.
func cleanRecord(record []string) ([]string, error) {
	score, err := strconv.ParseFloat(strings.Split(record[0], "-")[0], 64)
	if err != nil {
		return nil, err
	}
	rate, err := strconv.ParseFloat(strings.TrimSuffix(record[1], "%"), 64)
	if err != nil {
		return nil, err
	}

	class := "0.0"
	if rate <= 12.0 {
		class = "1.0"
	}
	scaled := strconv.FormatFloat((score-scoreMin)/(scoreMax-scoreMin), 'f', 4, 64)
	return []string{scaled, class}, nil
}