<?xml version="1.0" encoding="UTF-8"?>
<!-- prep.drawio -->
<mxfile host="app.diagrams.net" modified="2021-10-13T15:24:30.921Z" agent="5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/94.0.4606.81 Safari/537.36" etag="UOZSTwaqPv2furvwkqX5" version="15.5.0" type="github">
<diagram id="C5RBs43oDa-KdzZeNtuy" name="Page-1">
<mxGraphModel dx="786" dy="993" grid="1" gridSize="10" guides="1" tooltips="1" connect="1" arrows="1" fold="1" page="1" pageScale="1" pageWidth="827" pageHeight="1169" math="0" shadow="0">
<root>
<!-- Parentless top-level cell, then the cell that the shapes and connectors below name as their parent. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-0"/>
<mxCell parent="WIyWlLk6GJQsqaUBKTNV-0" id="WIyWlLk6GJQsqaUBKTNV-1"/>
<!-- Unlabeled connector from cell WIyWlLk6GJQsqaUBKTNV-3 to cell WIyWlLk6GJQsqaUBKTNV-6. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-2"
        edge="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        source="WIyWlLk6GJQsqaUBKTNV-3"
        target="WIyWlLk6GJQsqaUBKTNV-6"
        value=""
        style="rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=11;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;edgeStyle=orthogonalEdgeStyle;">
  <mxGeometry as="geometry" relative="1"/>
</mxCell>
<!-- Rounded box: news article collection (lists three newspapers and the two search keywords). -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-3"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;언론기사 수집&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 8px&quot;&gt;조선일보, 한국일보, 경향신문&lt;br&gt;검색 키워드: 재난지원금, 재난기본소득&lt;br&gt;&lt;/font&gt;"
        style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;glass=0;strokeWidth=1;shadow=0;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="130" y="100" width="137" height="60" as="geometry" />
</mxCell>
<!-- Connector labeled "task" (Korean label) from cell WIyWlLk6GJQsqaUBKTNV-6 to cell WIyWlLk6GJQsqaUBKTNV-10. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-4"
        edge="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        source="WIyWlLk6GJQsqaUBKTNV-6"
        target="WIyWlLk6GJQsqaUBKTNV-10"
        value="작업"
        style="rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=11;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;edgeStyle=orthogonalEdgeStyle;">
  <mxGeometry as="geometry" relative="1" y="22">
    <mxPoint as="offset"/>
  </mxGeometry>
</mxCell>
<!-- Connector labeled "result" (Korean label) from cell WIyWlLk6GJQsqaUBKTNV-6 to cell WIyWlLk6GJQsqaUBKTNV-7. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-5"
        edge="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        source="WIyWlLk6GJQsqaUBKTNV-6"
        target="WIyWlLk6GJQsqaUBKTNV-7"
        value="결과"
        style="edgeStyle=orthogonalEdgeStyle;rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=9;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;">
  <mxGeometry as="geometry" relative="1" y="10">
    <mxPoint as="offset"/>
  </mxGeometry>
</mxCell>
<!-- Diamond: quotation extraction step. -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-6"
        value="&lt;font&gt;&lt;span style=&quot;font-size: 10px&quot;&gt;인용문 추출&lt;/span&gt;&lt;br&gt;&lt;/font&gt;"
        style="rhombus;whiteSpace=wrap;html=1;shadow=0;fontFamily=Helvetica;fontSize=11;align=center;strokeWidth=1;spacing=6;spacingTop=-4;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="148.5" y="200" width="100" height="80" as="geometry" />
</mxCell>
<!-- Rounded box: quotations, n = 2,861. -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-7"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;인용문&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 9px&quot;&gt;(n = 2,861)&lt;/font&gt;"
        style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;glass=0;strokeWidth=1;shadow=0;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="314" y="220" width="80" height="40" as="geometry" />
</mxCell>
<!-- Connector labeled "task" (Korean label) from cell WIyWlLk6GJQsqaUBKTNV-10 into the top centre of cell TpO_H_RYObl5JqrHC5Rp-1. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-8"
        edge="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        source="WIyWlLk6GJQsqaUBKTNV-10"
        target="TpO_H_RYObl5JqrHC5Rp-1"
        value="작업"
        style="rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=11;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;edgeStyle=orthogonalEdgeStyle;entryX=0.5;entryY=0;entryDx=0;entryDy=0;">
  <mxGeometry as="geometry" relative="1" y="22">
    <mxPoint as="offset"/>
  </mxGeometry>
</mxCell>
<!-- Connector labeled "result" (Korean label) from cell WIyWlLk6GJQsqaUBKTNV-10 to cell WIyWlLk6GJQsqaUBKTNV-12. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-9"
        edge="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        source="WIyWlLk6GJQsqaUBKTNV-10"
        target="WIyWlLk6GJQsqaUBKTNV-12"
        value="결과"
        style="edgeStyle=orthogonalEdgeStyle;rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=9;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;">
  <mxGeometry as="geometry" relative="1" y="10">
    <mxPoint as="offset"/>
  </mxGeometry>
</mxCell>
<!-- Diamond: first data-cleaning pass (duplicate removal). -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-10"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;데이터 1차 정제&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 8px&quot;&gt;중복값 제거&lt;/font&gt;"
        style="rhombus;whiteSpace=wrap;html=1;shadow=0;fontFamily=Helvetica;fontSize=11;align=center;strokeWidth=1;spacing=6;spacingTop=-4;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="148.5" y="320" width="100" height="80" as="geometry" />
</mxCell>
<!-- Rounded box with the plain-text label "n = 1,499"; it is the target of edge TpO_H_RYObl5JqrHC5Rp-3 and the source of edge o_Thwpqc5d8Y5QQ_MUpu-1. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-11"
        vertex="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        value="n = 1,499"
        style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;glass=0;strokeWidth=1;shadow=0;">
  <mxGeometry as="geometry" x="138.5" y="560" width="120" height="40"/>
</mxCell>
<!-- Rounded box: quotations, n = 2,292. -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="WIyWlLk6GJQsqaUBKTNV-12"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;인용문&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 9px&quot;&gt;(n = 2,292)&lt;/font&gt;"
        style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;glass=0;strokeWidth=1;shadow=0;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="314" y="340" width="80" height="40" as="geometry" />
</mxCell>
<!-- Unlabeled connector from the right side of cell WIyWlLk6GJQsqaUBKTNV-11 to the left side of cell o_Thwpqc5d8Y5QQ_MUpu-2. -->
<!-- This edge has no edgeStyle, so the waypoints alone shape the path: two corner points at x=404 give one horizontal run, one vertical run, and one horizontal run. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-1" value="" style="endArrow=classic;html=1;exitX=1;exitY=0.5;exitDx=0;exitDy=0;entryX=0;entryY=0.5;entryDx=0;entryDy=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="WIyWlLk6GJQsqaUBKTNV-11" target="o_Thwpqc5d8Y5QQ_MUpu-2" edge="1">
  <mxGeometry width="50" height="50" relative="1" as="geometry">
    <mxPoint x="344" y="490" as="sourcePoint" />
    <mxPoint x="444" y="210" as="targetPoint" />
    <Array as="points">
      <!-- y=580 is the vertical centre of the source box (560 + 40/2). -->
      <mxPoint x="404" y="580" />
      <!-- y=130 is the vertical centre of the target box (100 + 60/2). -->
      <mxPoint x="404" y="130" />
    </Array>
  </mxGeometry>
</mxCell>
<!-- Rounded box: morphological analysis and noun extraction, n = 47,251. -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-2"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;형태소 분석 및 명사 추출&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 9px&quot;&gt;(n = 47,251)&lt;/font&gt;"
        style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="420" y="100" width="120" height="60" as="geometry" />
</mxCell>
<!-- Connector labeled "task" (Korean label) from cell o_Thwpqc5d8Y5QQ_MUpu-5 to cell o_Thwpqc5d8Y5QQ_MUpu-9. -->
<!-- No waypoints: both diamonds are centred on x=480 (430 + 100/2), so the connection is a straight vertical line. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-3" value="작업" style="rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=11;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;edgeStyle=orthogonalEdgeStyle;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="o_Thwpqc5d8Y5QQ_MUpu-5" target="o_Thwpqc5d8Y5QQ_MUpu-9" edge="1">
  <mxGeometry x="-0.3333" y="16" relative="1" as="geometry">
    <mxPoint as="offset" />
  </mxGeometry>
</mxCell>
<!-- Connector labeled "result" (Korean label) from cell o_Thwpqc5d8Y5QQ_MUpu-5 to cell o_Thwpqc5d8Y5QQ_MUpu-6. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-4"
        edge="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        source="o_Thwpqc5d8Y5QQ_MUpu-5"
        target="o_Thwpqc5d8Y5QQ_MUpu-6"
        value="결과"
        style="edgeStyle=orthogonalEdgeStyle;rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=9;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;">
  <mxGeometry as="geometry" relative="1" y="10">
    <mxPoint as="offset"/>
  </mxGeometry>
</mxCell>
<!-- Diamond: first noun-cleaning pass (noun length k greater than 1 and at most 10). -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value; the less-than sign shown in the label is therefore double-escaped. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-5"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;1차 정제&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 8px&quot;&gt;명사길이: 1 &amp;lt; k ≤ 10&lt;br&gt;&lt;/font&gt;"
        style="rhombus;whiteSpace=wrap;html=1;shadow=0;fontFamily=Helvetica;fontSize=11;align=center;strokeWidth=1;spacing=6;spacingTop=-4;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="430" y="200" width="100" height="80" as="geometry" />
</mxCell>
<!-- Rounded box: nouns, n = 35,538. -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-6"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;명사&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 9px&quot;&gt;(n = 35,538)&lt;/font&gt;"
        style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;glass=0;strokeWidth=1;shadow=0;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="570" y="220" width="80" height="40" as="geometry" />
</mxCell>
<!-- Connector labeled "task" (Korean label) from cell o_Thwpqc5d8Y5QQ_MUpu-9 to cell o_Thwpqc5d8Y5QQ_MUpu-14. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-7"
        edge="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        source="o_Thwpqc5d8Y5QQ_MUpu-9"
        target="o_Thwpqc5d8Y5QQ_MUpu-14"
        value="작업"
        style="rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=11;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;edgeStyle=orthogonalEdgeStyle;">
  <mxGeometry as="geometry" relative="1" y="20">
    <mxPoint as="offset"/>
  </mxGeometry>
</mxCell>
<!-- Connector labeled "result" (Korean label) from cell o_Thwpqc5d8Y5QQ_MUpu-9 to cell o_Thwpqc5d8Y5QQ_MUpu-11. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-8"
        edge="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        source="o_Thwpqc5d8Y5QQ_MUpu-9"
        target="o_Thwpqc5d8Y5QQ_MUpu-11"
        value="결과"
        style="edgeStyle=orthogonalEdgeStyle;rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=9;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;">
  <mxGeometry as="geometry" relative="1" y="10">
    <mxPoint as="offset"/>
  </mxGeometry>
</mxCell>
<!-- Diamond: second noun-cleaning pass (stop-word handling, word merging). -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-9"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;2차 정제&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 8px&quot;&gt;불용어 처리&lt;br&gt;단어 통합&lt;br&gt;&lt;/font&gt;"
        style="rhombus;whiteSpace=wrap;html=1;shadow=0;fontFamily=Helvetica;fontSize=11;align=center;strokeWidth=1;spacing=6;spacingTop=-4;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="430" y="320" width="100" height="80" as="geometry" />
</mxCell>
<!-- Rounded box with the plain-text label "n = 30,702", placed at x=420, y=560. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-10"
        vertex="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        value="n = 30,702"
        style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;glass=0;strokeWidth=1;shadow=0;">
  <mxGeometry as="geometry" x="420" y="560" width="120" height="40"/>
</mxCell>
<!-- Rounded box: nouns, n = 33,527. -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-11"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;명사&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 9px&quot;&gt;(n = 33,527)&lt;/font&gt;"
        style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;glass=0;strokeWidth=1;shadow=0;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="570" y="340" width="80" height="40" as="geometry" />
</mxCell>
<!-- Unlabeled connector from cell o_Thwpqc5d8Y5QQ_MUpu-2 into the top centre of cell o_Thwpqc5d8Y5QQ_MUpu-5. -->
<!-- The source attribute attaches the arrow to the box whose bottom edge (y = 100 + 60) the stored start point sits on; the stored points are kept unchanged. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-12" value="" style="rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=11;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;edgeStyle=orthogonalEdgeStyle;entryX=0.5;entryY=0;entryDx=0;entryDy=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="o_Thwpqc5d8Y5QQ_MUpu-2" target="o_Thwpqc5d8Y5QQ_MUpu-5" edge="1">
  <mxGeometry relative="1" as="geometry">
    <mxPoint x="479.71" y="160" as="sourcePoint" />
    <mxPoint x="480" y="190" as="targetPoint" />
  </mxGeometry>
</mxCell>
<!-- Diamond: third noun-cleaning pass (frequency k of at least 2). -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-14"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;3차 정제&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 8px&quot;&gt;빈도수 2 ≤ k&lt;br&gt;&lt;/font&gt;"
        style="rhombus;whiteSpace=wrap;html=1;shadow=0;fontFamily=Helvetica;fontSize=11;align=center;strokeWidth=1;spacing=6;spacingTop=-4;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="430" y="440" width="100" height="80" as="geometry" />
</mxCell>
<!-- Connector labeled "result" (Korean label) from cell o_Thwpqc5d8Y5QQ_MUpu-14 to cell o_Thwpqc5d8Y5QQ_MUpu-18. -->
<!-- The source attribute attaches the arrow to the diamond whose right corner (x = 430 + 100, y = 440 + 40) the stored start point sits on. -->
<!-- No waypoints: start and end lie on the same horizontal line, y=480. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-17" value="결과" style="edgeStyle=orthogonalEdgeStyle;rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=9;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="o_Thwpqc5d8Y5QQ_MUpu-14" target="o_Thwpqc5d8Y5QQ_MUpu-18" edge="1">
  <mxGeometry y="10" relative="1" as="geometry">
    <mxPoint as="offset" />
    <mxPoint x="529.9999999999999" y="480.0000000000001" as="sourcePoint" />
  </mxGeometry>
</mxCell>
<!-- Rounded box: nouns, n = 30,702. -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-18"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;명사&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 9px&quot;&gt;(n = 30,702)&lt;/font&gt;"
        style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;glass=0;strokeWidth=1;shadow=0;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="570" y="460" width="80" height="40" as="geometry" />
</mxCell>
<!-- Connector labeled "final" (Korean label) from cell o_Thwpqc5d8Y5QQ_MUpu-14 to cell o_Thwpqc5d8Y5QQ_MUpu-10. -->
<!-- source and target attach the arrow to the shapes its stored end points touch: the diamond's bottom corner (y = 440 + 80) and the top edge of the box at y=560. -->
<mxCell id="o_Thwpqc5d8Y5QQ_MUpu-24" value="최종" style="rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=11;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;edgeStyle=orthogonalEdgeStyle;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="o_Thwpqc5d8Y5QQ_MUpu-14" target="o_Thwpqc5d8Y5QQ_MUpu-10" edge="1">
  <mxGeometry y="20" relative="1" as="geometry">
    <mxPoint as="offset" />
    <mxPoint x="479.5800000000001" y="519.9999999999999" as="sourcePoint" />
    <mxPoint x="479.5800000000001" y="560.0000000000001" as="targetPoint" />
  </mxGeometry>
</mxCell>
<!-- Connector labeled "result" (Korean label) leaving the right-hand middle of cell WIyWlLk6GJQsqaUBKTNV-3 toward cell AkGz2d8EXF-ztuJMse4d-1. -->
<mxCell id="AkGz2d8EXF-ztuJMse4d-0"
        edge="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        source="WIyWlLk6GJQsqaUBKTNV-3"
        target="AkGz2d8EXF-ztuJMse4d-1"
        value="결과"
        style="edgeStyle=orthogonalEdgeStyle;rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=9;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;exitX=1;exitY=0.5;exitDx=0;exitDy=0;">
  <mxGeometry as="geometry" relative="1" y="10">
    <mxPoint as="offset"/>
    <mxPoint as="sourcePoint" x="270" y="130"/>
  </mxGeometry>
</mxCell>
<!-- Rounded box: news articles, n = 1,306. -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="AkGz2d8EXF-ztuJMse4d-1"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;언론기사&lt;br&gt;&lt;/font&gt;&lt;span style=&quot;font-size: 9px&quot;&gt;(n = 1,306)&lt;/span&gt;"
        style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;glass=0;strokeWidth=1;shadow=0;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="310" y="110" width="80" height="40" as="geometry" />
</mxCell>
<!-- Connector labeled "result" (Korean label) from cell TpO_H_RYObl5JqrHC5Rp-1 to cell TpO_H_RYObl5JqrHC5Rp-2. -->
<mxCell id="TpO_H_RYObl5JqrHC5Rp-0"
        edge="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        source="TpO_H_RYObl5JqrHC5Rp-1"
        target="TpO_H_RYObl5JqrHC5Rp-2"
        value="결과"
        style="edgeStyle=orthogonalEdgeStyle;rounded=0;html=1;jettySize=auto;orthogonalLoop=1;fontSize=9;endArrow=block;endFill=0;endSize=8;strokeWidth=1;shadow=0;labelBackgroundColor=none;">
  <mxGeometry as="geometry" relative="1" y="10">
    <mxPoint as="offset"/>
  </mxGeometry>
</mxCell>
<!-- Connector from cell TpO_H_RYObl5JqrHC5Rp-1 to cell WIyWlLk6GJQsqaUBKTNV-11; its own value is empty. -->
<mxCell id="TpO_H_RYObl5JqrHC5Rp-3"
        edge="1"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        source="TpO_H_RYObl5JqrHC5Rp-1"
        target="WIyWlLk6GJQsqaUBKTNV-11"
        value=""
        style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;">
  <mxGeometry as="geometry" relative="1"/>
</mxCell>
<!-- Separate label cell reading "final" (Korean label); its parent is the connector above. -->
<mxCell id="TpO_H_RYObl5JqrHC5Rp-4"
        vertex="1"
        connectable="0"
        parent="TpO_H_RYObl5JqrHC5Rp-3"
        value="최종"
        style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];">
  <mxGeometry as="geometry" relative="1" x="-0.2">
    <mxPoint as="offset" x="21" y="4"/>
  </mxGeometry>
</mxCell>
<!-- Diamond: second data-cleaning pass (remove actors with three or fewer statements, remove irrelevant quotations). -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="TpO_H_RYObl5JqrHC5Rp-1"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;데이터 2차 정제&lt;br&gt;&lt;/font&gt;&lt;span style=&quot;font-size: 8px&quot;&gt;발언 3회 이하 행위자 제거&lt;br&gt;무관한 인용문 제거&lt;br&gt;&lt;/span&gt;"
        style="rhombus;whiteSpace=wrap;html=1;shadow=0;fontFamily=Helvetica;fontSize=11;align=center;strokeWidth=1;spacing=6;spacingTop=-4;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="139.25" y="440" width="118.5" height="80" as="geometry" />
</mxCell>
<!-- Rounded box: quotations, n = 1,499. -->
<!-- The label is HTML (html=1), so its markup must be entity-escaped inside the attribute value. -->
<mxCell id="TpO_H_RYObl5JqrHC5Rp-2"
        value="&lt;font style=&quot;font-size: 10px&quot;&gt;인용문&lt;br&gt;&lt;/font&gt;&lt;font style=&quot;font-size: 9px&quot;&gt;(n = 1,499)&lt;/font&gt;"
        style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;glass=0;strokeWidth=1;shadow=0;"
        parent="WIyWlLk6GJQsqaUBKTNV-1"
        vertex="1">
  <mxGeometry x="314" y="460" width="80" height="40" as="geometry" />
</mxCell>
</root>
</mxGraphModel>
</diagram>
</mxfile>