<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0">
  <channel>
    <title>Allen's 데이터 맛집</title>
    <link>https://allensdatablog.tistory.com/</link>
    <description>데이터 분석가가 기록하는 기술 블로그</description>
    <language>ko</language>
    <pubDate>Thu, 16 Apr 2026 12:37:53 +0900</pubDate>
    <generator>TISTORY</generator>
    <ttl>100</ttl>
    <managingEditor>Allen93</managingEditor>
    <image>
      <title>Allen's 데이터 맛집</title>
      <url>https://tistory1.daumcdn.net/tistory/6485337/attach/57b1d64b598c475a90b683c23ef0383f</url>
      <link>https://allensdatablog.tistory.com</link>
    </image>
    <item>
      <title>BIC란 무엇인가 &amp;mdash; AIC와 무엇이 다를까?</title>
      <link>https://allensdatablog.tistory.com/entry/BIC%EB%9E%80-%EB%AC%B4%EC%97%87%EC%9D%B8%EA%B0%80-%E2%80%94-AIC%EC%99%80-%EB%AC%B4%EC%97%87%EC%9D%B4-%EB%8B%A4%EB%A5%BC%EA%B9%8C</link>
      <description>&lt;p data-end=&quot;240&quot; data-start=&quot;196&quot; data-ke-size=&quot;size16&quot;&gt;모델을 선택할 때 AIC를 사용했다면,&lt;br /&gt;거의 반드시 이런 질문이 따라옵니다.&lt;/p&gt;
&lt;blockquote data-end=&quot;266&quot; data-start=&quot;242&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;266&quot; data-start=&quot;244&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;BIC도 있다는데&amp;hellip; 뭐가 다른 거지?&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;285&quot; data-start=&quot;268&quot; data-ke-size=&quot;size16&quot;&gt;결론부터 아주 간단하게 말하면:&lt;/p&gt;
&lt;blockquote data-end=&quot;331&quot; data-start=&quot;287&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;331&quot; data-start=&quot;289&quot; data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;AIC는 예측 중심,&lt;br /&gt;BIC는 &amp;lsquo;진짜 모델 찾기&amp;rsquo; 중심입니다.&lt;br /&gt;&lt;br /&gt;&lt;/b&gt;&lt;/p&gt;
&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1536&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bAEWz1/dJMcahYigk2/vPaauOLN1p2udPkIzRwpl1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bAEWz1/dJMcahYigk2/vPaauOLN1p2udPkIzRwpl1/img.png&quot; data-alt=&quot;BIC&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bAEWz1/dJMcahYigk2/vPaauOLN1p2udPkIzRwpl1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbAEWz1%2FdJMcahYigk2%2FvPaauOLN1p2udPkIzRwpl1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;1536&quot; height=&quot;1024&quot; data-origin-width=&quot;1536&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;BIC&lt;/figcaption&gt;
&lt;/figure&gt;

&lt;p data-end=&quot;331&quot; data-start=&quot;289&quot; data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&amp;nbsp;&lt;/b&gt;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;hr data-end=&quot;336&quot; data-start=&quot;333&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;353&quot; data-start=&quot;338&quot; data-section-id=&quot;1nooqu3&quot;&gt;1) BIC의 핵심 개념&lt;/h1&gt;
&lt;p data-end=&quot;376&quot; data-start=&quot;355&quot; data-ke-size=&quot;size16&quot;&gt;BIC도 AIC와 동일한 출발점입니다.&lt;/p&gt;
&lt;blockquote data-end=&quot;394&quot; data-start=&quot;378&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;394&quot; data-start=&quot;380&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;좋은 모델은 무엇인가?&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;419&quot; data-start=&quot;396&quot; data-ke-size=&quot;size16&quot;&gt;하지만 BIC는 조금 더 강하게 말합니다.&lt;/p&gt;
&lt;blockquote data-end=&quot;447&quot; data-start=&quot;421&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;447&quot; data-start=&quot;423&quot; data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&amp;ldquo;불필요한 변수는 최대한 제거하자.&amp;rdquo;&lt;/b&gt;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;451&quot; data-start=&quot;449&quot; data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;497&quot; data-start=&quot;453&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;469&quot; data-start=&quot;453&quot; data-section-id=&quot;br2tht&quot;&gt;AIC &amp;rarr; 적당히 유연&lt;/li&gt;
&lt;li data-end=&quot;497&quot; data-start=&quot;470&quot; data-section-id=&quot;ugniv2&quot;&gt;BIC &amp;rarr; 더 보수적 (더 단순한 모델 선호)&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;502&quot; data-start=&quot;499&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;526&quot; data-start=&quot;504&quot; data-section-id=&quot;nkqzs1&quot;&gt;2) BIC 공식 (직관 중심 설명)&lt;/h1&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;BIC=ln⁡(n)&amp;sdot;k&amp;minus;2ln⁡(L)&lt;/blockquote&gt;
&lt;p data-end=&quot;577&quot; data-start=&quot;566&quot; data-ke-size=&quot;size16&quot;&gt;AIC와 비교해보면:&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;&lt;b&gt;항목&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;AIC&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; BIC&lt;/b&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;647&quot; data-start=&quot;579&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;647&quot; data-start=&quot;621&quot;&gt;
&lt;tr data-end=&quot;647&quot; data-start=&quot;621&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;631&quot; data-start=&quot;621&quot;&gt;복잡도 패널티&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;636&quot; data-start=&quot;631&quot;&gt;2k&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;647&quot; data-start=&quot;636&quot;&gt;ln(n)&amp;middot;k&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;652&quot; data-start=&quot;649&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;665&quot; data-start=&quot;654&quot; data-section-id=&quot;j5g7vb&quot; data-ke-size=&quot;size23&quot;&gt;✔ 핵심 차이&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;707&quot; data-start=&quot;667&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;684&quot; data-start=&quot;667&quot; data-section-id=&quot;ovcvkl&quot;&gt;AIC: 패널티 = 2k&lt;/li&gt;
&lt;li data-end=&quot;707&quot; data-start=&quot;685&quot; data-section-id=&quot;lm7d32&quot;&gt;BIC: 패널티 = ln(n)&amp;middot;k&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;735&quot; data-start=&quot;709&quot; data-ke-size=&quot;size16&quot;&gt;  여기서 중요한 건 &lt;b&gt;ln(n)&lt;/b&gt;입니다.&lt;/p&gt;
&lt;hr data-end=&quot;740&quot; data-start=&quot;737&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;761&quot; data-start=&quot;742&quot; data-section-id=&quot;16h6vzz&quot;&gt;3) 왜 ln(n)이 중요한가?&lt;/h1&gt;
&lt;p data-end=&quot;772&quot; data-start=&quot;763&quot; data-ke-size=&quot;size16&quot;&gt;n = 표본 크기&lt;/p&gt;
&lt;p data-end=&quot;780&quot; data-start=&quot;774&quot; data-ke-size=&quot;size16&quot;&gt;예를 들어:&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;&lt;b&gt;n&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;ln(n)&lt;/b&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;853&quot; data-start=&quot;782&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;853&quot; data-start=&quot;812&quot;&gt;
&lt;tr data-end=&quot;824&quot; data-start=&quot;812&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;817&quot; data-start=&quot;812&quot;&gt;10&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;824&quot; data-start=&quot;817&quot;&gt;2.3&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;838&quot; data-start=&quot;825&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;831&quot; data-start=&quot;825&quot;&gt;100&lt;/td&gt;
&lt;td data-end=&quot;838&quot; data-start=&quot;831&quot; data-col-size=&quot;sm&quot;&gt;4.6&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;853&quot; data-start=&quot;839&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;846&quot; data-start=&quot;839&quot;&gt;1000&lt;/td&gt;
&lt;td data-end=&quot;853&quot; data-start=&quot;846&quot; data-col-size=&quot;sm&quot;&gt;6.9&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;857&quot; data-start=&quot;855&quot; data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;blockquote data-end=&quot;901&quot; data-start=&quot;859&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;901&quot; data-start=&quot;861&quot; data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;데이터가 많아질수록 BIC는 변수 추가를 더 강하게 벌점 줍니다.&lt;/b&gt;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;hr data-end=&quot;906&quot; data-start=&quot;903&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;916&quot; data-start=&quot;908&quot; data-section-id=&quot;14j1iky&quot; data-ke-size=&quot;size23&quot;&gt;✔ 의미&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;962&quot; data-start=&quot;918&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;962&quot; data-start=&quot;918&quot; data-section-id=&quot;udb6ue&quot;&gt;데이터 많음 &amp;rarr; 모델 확신 높음&lt;br /&gt;&amp;rarr; 불필요한 변수는 더 엄격하게 제거&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;1003&quot; data-start=&quot;964&quot; data-ke-size=&quot;size16&quot;&gt;  그래서 BIC는 &amp;ldquo;진짜 필요한 변수만 남기려는 성향&amp;rdquo;이 강합니다.&lt;/p&gt;
&lt;hr data-end=&quot;1008&quot; data-start=&quot;1005&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;1027&quot; data-start=&quot;1010&quot; data-section-id=&quot;1s8rcca&quot;&gt;4) 자동차 예시로 이해하기&lt;/h1&gt;
&lt;p data-end=&quot;1046&quot; data-start=&quot;1029&quot; data-ke-size=&quot;size16&quot;&gt;연비 모델을 만든다고 해봅시다.&lt;/p&gt;
&lt;h3 data-end=&quot;1058&quot; data-start=&quot;1048&quot; data-section-id=&quot;1758nzr&quot; data-ke-size=&quot;size23&quot;&gt;모델 A&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1096&quot; data-start=&quot;1059&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1068&quot; data-start=&quot;1059&quot; data-section-id=&quot;o4qzi6&quot;&gt;변수 2개&lt;/li&gt;
&lt;li data-end=&quot;1082&quot; data-start=&quot;1069&quot; data-section-id=&quot;1in8d1j&quot;&gt;AIC = 180&lt;/li&gt;
&lt;li data-end=&quot;1096&quot; data-start=&quot;1083&quot; data-section-id=&quot;1bw1het&quot;&gt;BIC = 190&lt;/li&gt;
&lt;/ul&gt;
&lt;h3 data-end=&quot;1108&quot; data-start=&quot;1098&quot; data-section-id=&quot;1758juc&quot; data-ke-size=&quot;size23&quot;&gt;모델 B&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1146&quot; data-start=&quot;1109&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1118&quot; data-start=&quot;1109&quot; data-section-id=&quot;o4tvp6&quot;&gt;변수 6개&lt;/li&gt;
&lt;li data-end=&quot;1132&quot; data-start=&quot;1119&quot; data-section-id=&quot;1inasfh&quot;&gt;AIC = 175&lt;/li&gt;
&lt;li data-end=&quot;1146&quot; data-start=&quot;1133&quot; data-section-id=&quot;1bwx0oe&quot;&gt;BIC = 210&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1151&quot; data-start=&quot;1148&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1159&quot; data-start=&quot;1153&quot; data-section-id=&quot;1hrnne7&quot; data-ke-size=&quot;size23&quot;&gt;해석&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1196&quot; data-start=&quot;1161&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1178&quot; data-start=&quot;1161&quot; data-section-id=&quot;m3hmm&quot;&gt;AIC &amp;rarr; 모델 B 선택&lt;/li&gt;
&lt;li data-end=&quot;1196&quot; data-start=&quot;1179&quot; data-section-id=&quot;19f5f6m&quot;&gt;BIC &amp;rarr; 모델 A 선택&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;1200&quot; data-start=&quot;1198&quot; data-ke-size=&quot;size16&quot;&gt;왜?&lt;/p&gt;
&lt;p data-end=&quot;1244&quot; data-start=&quot;1202&quot; data-ke-size=&quot;size16&quot;&gt;  BIC는&lt;br /&gt;&amp;ldquo;변수가 너무 많다 &amp;rarr; 과적합 위험&amp;rdquo;&lt;br /&gt;이라고 판단한 것&lt;/p&gt;
&lt;hr data-end=&quot;1249&quot; data-start=&quot;1246&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;1277&quot; data-start=&quot;1251&quot; data-section-id=&quot;1u5yfhw&quot;&gt;5) AIC vs BIC &amp;mdash; 핵심 차이 정리&lt;/h1&gt;
&lt;div&gt;
&lt;div&gt;&lt;b&gt;구분&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; AIC&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; BIC&lt;/b&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;1443&quot; data-start=&quot;1279&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;1443&quot; data-start=&quot;1321&quot;&gt;
&lt;tr data-end=&quot;1346&quot; data-start=&quot;1321&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1326&quot; data-start=&quot;1321&quot;&gt;목적&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1334&quot; data-start=&quot;1326&quot;&gt;예측 성능&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1346&quot; data-start=&quot;1334&quot;&gt;진짜 모델 찾기&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1364&quot; data-start=&quot;1347&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1353&quot; data-start=&quot;1347&quot;&gt;패널티&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1358&quot; data-start=&quot;1353&quot;&gt;약함&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1364&quot; data-start=&quot;1358&quot;&gt;강함&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1396&quot; data-start=&quot;1365&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1373&quot; data-start=&quot;1365&quot;&gt;변수 선택&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1385&quot; data-start=&quot;1373&quot;&gt;비교적 많이 포함&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1396&quot; data-start=&quot;1385&quot;&gt;최소한만 포함&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1426&quot; data-start=&quot;1397&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1408&quot; data-start=&quot;1397&quot;&gt;데이터 많을수록&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1416&quot; data-start=&quot;1408&quot;&gt;영향 적음&lt;/td&gt;
&lt;td data-end=&quot;1426&quot; data-start=&quot;1416&quot; data-col-size=&quot;sm&quot;&gt;매우 보수적&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1443&quot; data-start=&quot;1427&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1432&quot; data-start=&quot;1427&quot;&gt;성향&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1437&quot; data-start=&quot;1432&quot;&gt;유연&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1443&quot; data-start=&quot;1437&quot;&gt;엄격&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;1448&quot; data-start=&quot;1445&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;1477&quot; data-start=&quot;1450&quot; data-section-id=&quot;wm1cct&quot;&gt;6) 언제 AIC, 언제 BIC를 써야 할까?&lt;/h1&gt;
&lt;p data-end=&quot;1500&quot; data-start=&quot;1479&quot; data-ke-size=&quot;size16&quot;&gt;이건 실무에서 매우 중요한 질문입니다.&lt;/p&gt;
&lt;hr data-end=&quot;1505&quot; data-start=&quot;1502&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1522&quot; data-start=&quot;1507&quot; data-section-id=&quot;4wo3lo&quot; data-ke-size=&quot;size26&quot;&gt;✔ AIC가 좋은 경우&lt;/h2&gt;
&lt;p data-end=&quot;1541&quot; data-start=&quot;1524&quot; data-ke-size=&quot;size16&quot;&gt;  &lt;b&gt;예측 모델 만들 때&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1594&quot; data-start=&quot;1543&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1556&quot; data-start=&quot;1543&quot; data-section-id=&quot;1g0fcsp&quot;&gt;머신러닝 전 단계&lt;/li&gt;
&lt;li data-end=&quot;1570&quot; data-start=&quot;1557&quot; data-section-id=&quot;dugem4&quot;&gt;실제 서비스 모델&lt;/li&gt;
&lt;li data-end=&quot;1581&quot; data-start=&quot;1571&quot; data-section-id=&quot;16v1nz8&quot;&gt;추천 시스템&lt;/li&gt;
&lt;li data-end=&quot;1594&quot; data-start=&quot;1582&quot; data-section-id=&quot;61hi41&quot;&gt;품질 예측 모델&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;1621&quot; data-start=&quot;1596&quot; data-ke-size=&quot;size16&quot;&gt;&amp;rarr; 약간 과적합이어도 예측이 잘 되면 OK&lt;/p&gt;
&lt;hr data-end=&quot;1626&quot; data-start=&quot;1623&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1643&quot; data-start=&quot;1628&quot; data-section-id=&quot;z7gejj&quot; data-ke-size=&quot;size26&quot;&gt;✔ BIC가 좋은 경우&lt;/h2&gt;
&lt;p data-end=&quot;1665&quot; data-start=&quot;1645&quot; data-ke-size=&quot;size16&quot;&gt;  &lt;b&gt;설명 모델 / 원인 분석&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1712&quot; data-start=&quot;1667&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1679&quot; data-start=&quot;1667&quot; data-section-id=&quot;t4lpct&quot;&gt;변수 영향 해석&lt;/li&gt;
&lt;li data-end=&quot;1689&quot; data-start=&quot;1680&quot; data-section-id=&quot;1v66qux&quot;&gt;원인 규명&lt;/li&gt;
&lt;li data-end=&quot;1699&quot; data-start=&quot;1690&quot; data-section-id=&quot;1ocgbpj&quot;&gt;논문&amp;middot;연구&lt;/li&gt;
&lt;li data-end=&quot;1712&quot; data-start=&quot;1700&quot; data-section-id=&quot;1glq7vd&quot;&gt;공정 원인 분석&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;1735&quot; data-start=&quot;1714&quot; data-ke-size=&quot;size16&quot;&gt;&amp;rarr; &amp;ldquo;진짜 필요한 변수만 남기고 싶다&amp;rdquo;&lt;/p&gt;
&lt;hr data-end=&quot;1740&quot; data-start=&quot;1737&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;1766&quot; data-start=&quot;1742&quot; data-section-id=&quot;6irb91&quot;&gt;7) 직관적으로 이해하는 가장 쉬운 방법&lt;/h1&gt;
&lt;p data-end=&quot;1785&quot; data-start=&quot;1768&quot; data-ke-size=&quot;size16&quot;&gt;이렇게 생각하면 가장 쉽습니다.&lt;/p&gt;
&lt;hr data-end=&quot;1790&quot; data-start=&quot;1787&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1802&quot; data-start=&quot;1792&quot; data-section-id=&quot;xac3q6&quot; data-ke-size=&quot;size23&quot;&gt;  AIC&lt;/h3&gt;
&lt;blockquote data-end=&quot;1834&quot; data-start=&quot;1804&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;1834&quot; data-start=&quot;1806&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;좀 복잡해도 괜찮으니까, 예측 잘 되는 모델 줘&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;hr data-end=&quot;1839&quot; data-start=&quot;1836&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1851&quot; data-start=&quot;1841&quot; data-section-id=&quot;xac671&quot; data-ke-size=&quot;size23&quot;&gt;  BIC&lt;/h3&gt;
&lt;blockquote data-end=&quot;1883&quot; data-start=&quot;1853&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;1883&quot; data-start=&quot;1855&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;쓸데없는 변수 다 빼고, 진짜 중요한 것만 남겨&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;hr data-end=&quot;1888&quot; data-start=&quot;1885&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;1913&quot; data-start=&quot;1890&quot; data-section-id=&quot;syp5dz&quot;&gt;8) 실제 데이터 분석 흐름에서의 사용&lt;/h1&gt;
&lt;p data-end=&quot;1932&quot; data-start=&quot;1915&quot; data-ke-size=&quot;size16&quot;&gt;실무에서는 이렇게 많이 씁니다.&lt;/p&gt;
&lt;hr data-end=&quot;1937&quot; data-start=&quot;1934&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1953&quot; data-start=&quot;1939&quot; data-section-id=&quot;12a4vbl&quot; data-ke-size=&quot;size23&quot;&gt;✔ Step 1&lt;/h3&gt;
&lt;p data-end=&quot;1962&quot; data-start=&quot;1954&quot; data-ke-size=&quot;size16&quot;&gt;여러 모델 생성&lt;/p&gt;
&lt;hr data-end=&quot;1967&quot; data-start=&quot;1964&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1983&quot; data-start=&quot;1969&quot; data-section-id=&quot;12a4xsi&quot; data-ke-size=&quot;size23&quot;&gt;✔ Step 2&lt;/h3&gt;
&lt;p data-end=&quot;2008&quot; data-start=&quot;1984&quot; data-ke-size=&quot;size16&quot;&gt;AIC로 1차 필터링&lt;br /&gt;&amp;rarr; 예측 성능 기준&lt;/p&gt;
&lt;hr data-end=&quot;2013&quot; data-start=&quot;2010&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;2029&quot; data-start=&quot;2015&quot; data-section-id=&quot;12a4x03&quot; data-ke-size=&quot;size23&quot;&gt;✔ Step 3&lt;/h3&gt;
&lt;p data-end=&quot;2052&quot; data-start=&quot;2030&quot; data-ke-size=&quot;size16&quot;&gt;BIC로 2차 필터링&lt;br /&gt;&amp;rarr; 변수 최소화&lt;/p&gt;
&lt;hr data-end=&quot;2057&quot; data-start=&quot;2054&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;p data-end=&quot;2064&quot; data-start=&quot;2059&quot; data-ke-size=&quot;size16&quot;&gt;  즉,&lt;/p&gt;
&lt;blockquote data-end=&quot;2097&quot; data-start=&quot;2066&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;2097&quot; data-start=&quot;2068&quot; data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;AIC로 넓게 보고,&lt;br /&gt;BIC로 정리한다&lt;/b&gt;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;hr data-end=&quot;2102&quot; data-start=&quot;2099&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;2115&quot; data-start=&quot;2104&quot; data-section-id=&quot;jk77q&quot;&gt;9) 한 장 요약&lt;/h1&gt;
&lt;div&gt;
&lt;div&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;2249&quot; data-start=&quot;2117&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;2249&quot; data-start=&quot;2145&quot;&gt;
&lt;tr data-end=&quot;2175&quot; data-start=&quot;2145&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2151&quot; data-start=&quot;2145&quot;&gt;BIC&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2175&quot; data-start=&quot;2151&quot;&gt;모델 선택 기준 (AIC보다 보수적)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;2198&quot; data-start=&quot;2176&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2181&quot; data-start=&quot;2176&quot;&gt;핵심&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2198&quot; data-start=&quot;2181&quot;&gt;복잡도 패널티가 더 강함&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;2225&quot; data-start=&quot;2199&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2204&quot; data-start=&quot;2199&quot;&gt;특징&lt;/td&gt;
&lt;td data-end=&quot;2225&quot; data-start=&quot;2204&quot; data-col-size=&quot;sm&quot;&gt;데이터 많을수록 변수 제거 강함&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;2249&quot; data-start=&quot;2226&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2231&quot; data-start=&quot;2226&quot;&gt;목적&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2249&quot; data-start=&quot;2231&quot;&gt;진짜 중요한 변수만 남기기&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;2254&quot; data-start=&quot;2251&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;2268&quot; data-start=&quot;2256&quot; data-section-id=&quot;1bmx1pi&quot;&gt;  핵심 한 문장&lt;/h1&gt;
&lt;blockquote data-end=&quot;2312&quot; data-start=&quot;2270&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;2312&quot; data-start=&quot;2272&quot; data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&amp;ldquo;BIC는 &amp;lsquo;정확한 모델&amp;rsquo;보다 &amp;lsquo;간결한 진짜 모델&amp;rsquo;을 선택한다.&amp;rdquo;&lt;/b&gt;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;2459&quot; data-start=&quot;2436&quot; data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>Ai</category>
      <category>AIC</category>
      <category>bic</category>
      <category>데이터</category>
      <category>데이터분석</category>
      <category>머신러닝</category>
      <category>모델</category>
      <category>복잡도</category>
      <category>통계</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/485</guid>
      <comments>https://allensdatablog.tistory.com/entry/BIC%EB%9E%80-%EB%AC%B4%EC%97%87%EC%9D%B8%EA%B0%80-%E2%80%94-AIC%EC%99%80-%EB%AC%B4%EC%97%87%EC%9D%B4-%EB%8B%A4%EB%A5%BC%EA%B9%8C#entry485comment</comments>
      <pubDate>Fri, 10 Apr 2026 11:10:43 +0900</pubDate>
    </item>
    <item>
      <title>AIC란 무엇인가 - &amp;quot;좋은 모델&amp;quot;을 고르는 기준</title>
      <link>https://allensdatablog.tistory.com/entry/AIC%EB%9E%80-%EB%AC%B4%EC%97%87%EC%9D%B8%EA%B0%80-%EC%A2%8B%EC%9D%80-%EB%AA%A8%EB%8D%B8%EC%9D%84-%EA%B3%A0%EB%A5%B4%EB%8A%94-%EA%B8%B0%EC%A4%80</link>
      <description>&lt;p data-end=&quot;259&quot; data-start=&quot;231&quot; data-ke-size=&quot;size16&quot;&gt;모델을 여러 개 만들다 보면 이런 상황이 생깁니다.&lt;/p&gt;
&lt;blockquote data-end=&quot;308&quot; data-start=&quot;261&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;308&quot; data-start=&quot;263&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;이 모델도 괜찮고&amp;hellip; 저 모델도 괜찮은데&lt;br /&gt;도대체 뭐가 더 좋은 모델이지?&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;338&quot; data-start=&quot;310&quot; data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차 연비 모델을 만들었다고 해봅시다.&lt;/p&gt;
&lt;h3 data-end=&quot;350&quot; data-start=&quot;340&quot; data-section-id=&quot;1758nzr&quot; data-ke-size=&quot;size23&quot;&gt;모델 A&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;374&quot; data-start=&quot;351&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;360&quot; data-start=&quot;351&quot; data-section-id=&quot;o4qzi6&quot;&gt;변수 2개&lt;/li&gt;
&lt;li data-end=&quot;374&quot; data-start=&quot;361&quot; data-section-id=&quot;wrpuum&quot;&gt;R&amp;sup2; = 0.72&lt;/li&gt;
&lt;/ul&gt;
&lt;h3 data-end=&quot;386&quot; data-start=&quot;376&quot; data-section-id=&quot;1758juc&quot; data-ke-size=&quot;size23&quot;&gt;모델 B&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;410&quot; data-start=&quot;387&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;396&quot; data-start=&quot;387&quot; data-section-id=&quot;o4tvp6&quot;&gt;변수 6개&lt;/li&gt;
&lt;li data-end=&quot;410&quot; data-start=&quot;397&quot; data-section-id=&quot;wrhhxi&quot;&gt;R&amp;sup2; = 0.85&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;440&quot; data-start=&quot;412&quot; data-ke-size=&quot;size16&quot;&gt;겉으로 보면 B가 좋아 보이죠.&lt;br /&gt;하지만 문제는&amp;hellip;&lt;/p&gt;
&lt;blockquote data-end=&quot;471&quot; data-start=&quot;442&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;471&quot; data-start=&quot;444&quot; data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;변수를 많이 넣으면 R&amp;sup2;는 무조건 올라간다&lt;/b&gt;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;521&quot; data-start=&quot;473&quot; data-ke-size=&quot;size16&quot;&gt;즉, B는 &amp;ldquo;더 좋은 모델&amp;rdquo;이 아니라&lt;br /&gt;&lt;b&gt;그냥 더 복잡한 모델&lt;/b&gt;일 수도 있습니다.&lt;/p&gt;
&lt;p data-end=&quot;551&quot; data-start=&quot;523&quot; data-ke-size=&quot;size16&quot;&gt;이걸 해결하기 위해 등장한 것이 바로 AIC입니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1536&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/nlpQ2/dJMcahxdtmn/rWjlkK5N51Wg50zegLWKmk/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/nlpQ2/dJMcahxdtmn/rWjlkK5N51Wg50zegLWKmk/img.png&quot; data-alt=&quot;AIC&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/nlpQ2/dJMcahxdtmn/rWjlkK5N51Wg50zegLWKmk/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FnlpQ2%2FdJMcahxdtmn%2FrWjlkK5N51Wg50zegLWKmk%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;1536&quot; height=&quot;1024&quot; data-origin-width=&quot;1536&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;AIC&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;hr data-end=&quot;556&quot; data-start=&quot;553&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;575&quot; data-start=&quot;558&quot; data-section-id=&quot;rkoi3o&quot;&gt;1) AIC의 핵심 아이디어&lt;/h1&gt;
&lt;p data-end=&quot;600&quot; data-start=&quot;577&quot; data-ke-size=&quot;size16&quot;&gt;AIC는 한 문장으로 정리하면 이렇습니다.&lt;/p&gt;
&lt;blockquote data-end=&quot;640&quot; data-start=&quot;602&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;640&quot; data-start=&quot;604&quot; data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&amp;ldquo;모델의 적합도와 복잡도를 동시에 고려해서 점수를 매긴다&amp;rdquo;&lt;/b&gt;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;644&quot; data-start=&quot;642&quot; data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;690&quot; data-start=&quot;646&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;669&quot; data-start=&quot;646&quot; data-section-id=&quot;o7cjqm&quot;&gt;데이터에 잘 맞는 모델을 원하면서도&lt;/li&gt;
&lt;li data-end=&quot;690&quot; data-start=&quot;670&quot; data-section-id=&quot;1u6wjcs&quot;&gt;너무 복잡한 모델은 패널티를 준다&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;695&quot; data-start=&quot;692&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;717&quot; data-start=&quot;697&quot; data-section-id=&quot;1yxl25m&quot;&gt;2) AIC 공식 (그리고 직관)&lt;/h1&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;AIC=2k&amp;minus;2ln⁡(L)&lt;/blockquote&gt;
&lt;p data-end=&quot;756&quot; data-start=&quot;745&quot; data-ke-size=&quot;size16&quot;&gt;이걸 쉽게 풀어보면:&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;항목의미
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;850&quot; data-start=&quot;758&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;850&quot; data-start=&quot;786&quot;&gt;
&lt;tr data-end=&quot;808&quot; data-start=&quot;786&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;790&quot; data-start=&quot;786&quot;&gt;k&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;808&quot; data-start=&quot;790&quot;&gt;변수 개수 (모델 복잡도)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;850&quot; data-start=&quot;809&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;813&quot; data-start=&quot;809&quot;&gt;L&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;850&quot; data-start=&quot;813&quot;&gt;likelihood (모델이 데이터를 얼마나 잘 설명하는지)&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;854&quot; data-start=&quot;852&quot; data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;AIC=복잡도 패널티+적합도 점수&lt;/blockquote&gt;
&lt;hr data-end=&quot;903&quot; data-start=&quot;900&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;917&quot; data-start=&quot;905&quot; data-section-id=&quot;4ap2fr&quot; data-ke-size=&quot;size23&quot;&gt;✔ 해석 포인트&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;976&quot; data-start=&quot;919&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;947&quot; data-start=&quot;919&quot; data-section-id=&quot;jszyxe&quot;&gt;&lt;b&gt;k가 커지면 &amp;rarr; AIC 증가 (불리)&lt;/b&gt;&lt;/li&gt;
&lt;li data-end=&quot;976&quot; data-start=&quot;948&quot; data-section-id=&quot;y46d54&quot;&gt;&lt;b&gt;L이 커지면 &amp;rarr; AIC 감소 (유리)&lt;/b&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;1010&quot; data-start=&quot;978&quot; data-ke-size=&quot;size16&quot;&gt;  좋은 모델은?&lt;br /&gt;&amp;rarr; &lt;b&gt;AIC가 가장 작은 모델&lt;/b&gt;&lt;/p&gt;
&lt;hr data-end=&quot;1015&quot; data-start=&quot;1012&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;1040&quot; data-start=&quot;1017&quot; data-section-id=&quot;1kx049a&quot;&gt;3) 왜 이런 구조일까? (핵심 직관)&lt;/h1&gt;
&lt;p data-end=&quot;1064&quot; data-start=&quot;1042&quot; data-ke-size=&quot;size16&quot;&gt;AIC는 사실 이런 철학에서 출발합니다.&lt;/p&gt;
&lt;blockquote data-end=&quot;1096&quot; data-start=&quot;1066&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;1096&quot; data-start=&quot;1068&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;미래 데이터를 가장 잘 예측할 모델은 무엇인가?&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;1110&quot; data-start=&quot;1098&quot; data-ke-size=&quot;size16&quot;&gt;여기서 중요한 포인트:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1167&quot; data-start=&quot;1112&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1136&quot; data-start=&quot;1112&quot; data-section-id=&quot;1tfgrjk&quot;&gt;너무 단순한 모델 &amp;rarr; 데이터 못 설명&lt;/li&gt;
&lt;li data-end=&quot;1167&quot; data-start=&quot;1137&quot; data-section-id=&quot;s52ju&quot;&gt;너무 복잡한 모델 &amp;rarr; 과적합(overfitting)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;1191&quot; data-start=&quot;1169&quot; data-ke-size=&quot;size16&quot;&gt;AIC는 이 둘 사이의 균형을 잡습니다.&lt;/p&gt;
&lt;hr data-end=&quot;1196&quot; data-start=&quot;1193&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;1215&quot; data-start=&quot;1198&quot; data-section-id=&quot;1s8rcca&quot;&gt;4) 자동차 예시로 이해하기&lt;/h1&gt;
&lt;p data-end=&quot;1243&quot; data-start=&quot;1217&quot; data-ke-size=&quot;size16&quot;&gt;연비(Y)를 예측하는 모델을 만든다고 해봅시다.&lt;/p&gt;
&lt;h3 data-end=&quot;1255&quot; data-start=&quot;1245&quot; data-section-id=&quot;175607b&quot; data-ke-size=&quot;size23&quot;&gt;모델 1&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1283&quot; data-start=&quot;1256&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1269&quot; data-start=&quot;1256&quot; data-section-id=&quot;8m10ab&quot;&gt;변수: 차량 무게&lt;/li&gt;
&lt;li data-end=&quot;1283&quot; data-start=&quot;1270&quot; data-section-id=&quot;1impvjh&quot;&gt;AIC = 210&lt;/li&gt;
&lt;/ul&gt;
&lt;h3 data-end=&quot;1295&quot; data-start=&quot;1285&quot; data-section-id=&quot;1755zb8&quot; data-ke-size=&quot;size23&quot;&gt;모델 2&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1326&quot; data-start=&quot;1296&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1312&quot; data-start=&quot;1296&quot; data-section-id=&quot;1lk13zk&quot;&gt;변수: 무게 + 배기량&lt;/li&gt;
&lt;li data-end=&quot;1326&quot; data-start=&quot;1313&quot; data-section-id=&quot;1in8d1j&quot;&gt;AIC = 180&lt;/li&gt;
&lt;/ul&gt;
&lt;h3 data-end=&quot;1338&quot; data-start=&quot;1328&quot; data-section-id=&quot;1755yit&quot; data-ke-size=&quot;size23&quot;&gt;모델 3&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1390&quot; data-start=&quot;1339&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1376&quot; data-start=&quot;1339&quot; data-section-id=&quot;ru2isg&quot;&gt;변수: 무게 + 배기량 + 마력 + 타이어 + 온도 + 습도&lt;/li&gt;
&lt;li data-end=&quot;1390&quot; data-start=&quot;1377&quot; data-section-id=&quot;1in928z&quot;&gt;AIC = 195&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1395&quot; data-start=&quot;1392&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1403&quot; data-start=&quot;1397&quot; data-section-id=&quot;1hrnne7&quot; data-ke-size=&quot;size23&quot;&gt;해석&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1463&quot; data-start=&quot;1405&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1430&quot; data-start=&quot;1405&quot; data-section-id=&quot;n4e76a&quot;&gt;모델 2가 가장 낮음 &amp;rarr; &lt;b&gt;최적 모델&lt;/b&gt;&lt;/li&gt;
&lt;li data-end=&quot;1463&quot; data-start=&quot;1431&quot; data-section-id=&quot;98asch&quot;&gt;모델 3은 변수 많지만 AIC가 증가 &amp;rarr; &lt;b&gt;과적합&lt;/b&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;1476&quot; data-start=&quot;1465&quot; data-ke-size=&quot;size16&quot;&gt;  중요한 포인트:&lt;/p&gt;
&lt;blockquote data-end=&quot;1529&quot; data-start=&quot;1478&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;1529&quot; data-start=&quot;1480&quot; data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;변수가 많다고 좋은 모델이 아니다&lt;br /&gt;필요한 만큼만 쓰는 모델이 좋은 모델이다&lt;/b&gt;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;hr data-end=&quot;1534&quot; data-start=&quot;1531&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;1552&quot; data-start=&quot;1536&quot; data-section-id=&quot;bqxnu1&quot;&gt;5) AIC의 실무 사용법&lt;/h1&gt;
&lt;p data-end=&quot;1591&quot; data-start=&quot;1554&quot; data-ke-size=&quot;size16&quot;&gt;AIC는 &amp;ldquo;절대값&amp;rdquo;이 아니라&lt;br /&gt;&lt;b&gt;모델 간 비교용 지표&lt;/b&gt;입니다.&lt;/p&gt;
&lt;h3 data-end=&quot;1604&quot; data-start=&quot;1593&quot; data-section-id=&quot;1mp05jy&quot; data-ke-size=&quot;size23&quot;&gt;✔ 중요 원칙&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1668&quot; data-start=&quot;1606&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1625&quot; data-start=&quot;1606&quot; data-section-id=&quot;145vfnv&quot;&gt;AIC 값 자체는 의미 없음&lt;/li&gt;
&lt;li data-end=&quot;1651&quot; data-start=&quot;1626&quot; data-section-id=&quot;v9zcjh&quot;&gt;반드시 &lt;b&gt;여러 모델 비교&lt;/b&gt;에서 사용&lt;/li&gt;
&lt;li data-end=&quot;1668&quot; data-start=&quot;1652&quot; data-section-id=&quot;1jyog96&quot;&gt;가장 작은 AIC 선택&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1673&quot; data-start=&quot;1670&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1692&quot; data-start=&quot;1675&quot; data-section-id=&quot;1evzjt&quot; data-ke-size=&quot;size23&quot;&gt;✔ 차이(&amp;Delta;AIC) 해석&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;&amp;Delta;AIC해석
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;1781&quot; data-start=&quot;1694&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;1781&quot; data-start=&quot;1724&quot;&gt;
&lt;tr data-end=&quot;1741&quot; data-start=&quot;1724&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1732&quot; data-start=&quot;1724&quot;&gt;0 ~ 2&lt;/td&gt;
&lt;td data-end=&quot;1741&quot; data-start=&quot;1732&quot; data-col-size=&quot;sm&quot;&gt;거의 동일&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1759&quot; data-start=&quot;1742&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1750&quot; data-start=&quot;1742&quot;&gt;4 ~ 7&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1759&quot; data-start=&quot;1750&quot;&gt;차이 있음&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1781&quot; data-start=&quot;1760&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1768&quot; data-start=&quot;1760&quot;&gt;10 이상&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1781&quot; data-start=&quot;1768&quot;&gt;완전히 다른 수준&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;1786&quot; data-start=&quot;1783&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;1827&quot; data-start=&quot;1788&quot; data-section-id=&quot;mkgd3r&quot;&gt;6) AIC vs R&amp;sup2; vs p-value (헷갈리는 포인트 정리)&lt;/h1&gt;
&lt;div&gt;
&lt;div&gt;지표역할
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;1903&quot; data-start=&quot;1829&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;1903&quot; data-start=&quot;1857&quot;&gt;
&lt;tr data-end=&quot;1869&quot; data-start=&quot;1857&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1862&quot; data-start=&quot;1857&quot;&gt;R&amp;sup2;&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1869&quot; data-start=&quot;1862&quot;&gt;설명력&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1887&quot; data-start=&quot;1870&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1880&quot; data-start=&quot;1870&quot;&gt;p-value&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1887&quot; data-start=&quot;1880&quot;&gt;유의성&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1903&quot; data-start=&quot;1888&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1894&quot; data-start=&quot;1888&quot;&gt;AIC&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1903&quot; data-start=&quot;1894&quot;&gt;모델 선택&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;1911&quot; data-start=&quot;1905&quot; data-ke-size=&quot;size16&quot;&gt;  핵심:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1982&quot; data-start=&quot;1913&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1931&quot; data-start=&quot;1913&quot; data-section-id=&quot;lce49w&quot;&gt;R&amp;sup2; &amp;rarr; 얼마나 잘 맞는가&lt;/li&gt;
&lt;li data-end=&quot;1957&quot; data-start=&quot;1932&quot; data-section-id=&quot;1hjf6xo&quot;&gt;p-value &amp;rarr; 이 변수 의미 있는가&lt;/li&gt;
&lt;li data-end=&quot;1982&quot; data-start=&quot;1958&quot; data-section-id=&quot;jyhby3&quot;&gt;AIC &amp;rarr; 전체 모델 중 뭐가 좋은가&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1987&quot; data-start=&quot;1984&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;2008&quot; data-start=&quot;1989&quot; data-section-id=&quot;1hh961f&quot;&gt;7) AIC가 특히 중요한 상황&lt;/h1&gt;
&lt;p data-end=&quot;2032&quot; data-start=&quot;2010&quot; data-ke-size=&quot;size16&quot;&gt;AIC는 아래 상황에서 매우 강력합니다.&lt;/p&gt;
&lt;hr data-end=&quot;2037&quot; data-start=&quot;2034&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;2073&quot; data-start=&quot;2039&quot; data-section-id=&quot;lqwuka&quot; data-ke-size=&quot;size23&quot;&gt;✔ 1) 변수 선택 (Feature Selection)&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;2121&quot; data-start=&quot;2075&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;2086&quot; data-start=&quot;2075&quot; data-section-id=&quot;mvaquu&quot;&gt;변수 많을 때&lt;/li&gt;
&lt;li data-end=&quot;2110&quot; data-start=&quot;2087&quot; data-section-id=&quot;wdn5tp&quot;&gt;Stepwise regression&lt;/li&gt;
&lt;li data-end=&quot;2121&quot; data-start=&quot;2111&quot; data-section-id=&quot;14ywwhw&quot;&gt;자동 변수 선택&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;2126&quot; data-start=&quot;2123&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;2142&quot; data-start=&quot;2128&quot; data-section-id=&quot;13es1t9&quot; data-ke-size=&quot;size23&quot;&gt;✔ 2) 모델 비교&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;2199&quot; data-start=&quot;2144&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;2163&quot; data-start=&quot;2144&quot; data-section-id=&quot;dqxsfh&quot;&gt;선형 vs 로그 vs 다항식&lt;/li&gt;
&lt;li data-end=&quot;2178&quot; data-start=&quot;2164&quot; data-section-id=&quot;ck7wwh&quot;&gt;포아송 vs 음이항&lt;/li&gt;
&lt;li data-end=&quot;2199&quot; data-start=&quot;2179&quot; data-section-id=&quot;14ouqms&quot;&gt;로지스틱 vs 다른 분류 모델&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;2204&quot; data-start=&quot;2201&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;2221&quot; data-start=&quot;2206&quot; data-section-id=&quot;w7to1h&quot; data-ke-size=&quot;size23&quot;&gt;✔ 3) 과적합 방지&lt;/h3&gt;
&lt;p data-end=&quot;2244&quot; data-start=&quot;2223&quot; data-ke-size=&quot;size16&quot;&gt;AIC는 자동으로 이런 걸 막아줍니다:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;2294&quot; data-start=&quot;2246&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;2260&quot; data-start=&quot;2246&quot; data-section-id=&quot;1ctbxmm&quot;&gt;쓸데없는 변수 추가&lt;/li&gt;
&lt;li data-end=&quot;2274&quot; data-start=&quot;2261&quot; data-section-id=&quot;1czk4l1&quot;&gt;모델 복잡도 증가&lt;/li&gt;
&lt;li data-end=&quot;2294&quot; data-start=&quot;2275&quot; data-section-id=&quot;y7k2ws&quot;&gt;설명력만 보고 판단하는 실수&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;2299&quot; data-start=&quot;2296&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;2318&quot; data-start=&quot;2301&quot; data-section-id=&quot;16yltbs&quot;&gt;8) AIC의 한계 (중요)&lt;/h1&gt;
&lt;p data-end=&quot;2338&quot; data-start=&quot;2320&quot; data-ke-size=&quot;size16&quot;&gt;AIC도 완벽한 지표는 아닙니다.&lt;/p&gt;
&lt;hr data-end=&quot;2343&quot; data-start=&quot;2340&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;2370&quot; data-start=&quot;2345&quot; data-section-id=&quot;wen2bw&quot; data-ke-size=&quot;size23&quot;&gt;❗ 1) 표본이 너무 적으면 부정확&lt;/h3&gt;
&lt;p data-end=&quot;2386&quot; data-start=&quot;2371&quot; data-ke-size=&quot;size16&quot;&gt;&amp;rarr; 이럴 때는 AICc 사용&lt;/p&gt;
&lt;hr data-end=&quot;2391&quot; data-start=&quot;2388&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;2414&quot; data-start=&quot;2393&quot; data-section-id=&quot;17j3gfa&quot; data-ke-size=&quot;size23&quot;&gt;❗ 2) 해석 모델에는 부족&lt;/h3&gt;
&lt;p data-end=&quot;2431&quot; data-start=&quot;2415&quot; data-ke-size=&quot;size16&quot;&gt;&amp;rarr; 변수 의미는 따로 봐야 함&lt;/p&gt;
&lt;hr data-end=&quot;2436&quot; data-start=&quot;2433&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;2458&quot; data-start=&quot;2438&quot; data-section-id=&quot;1buxf8u&quot; data-ke-size=&quot;size23&quot;&gt;❗ 3) 절대적 기준 아님&lt;/h3&gt;
&lt;p data-end=&quot;2467&quot; data-start=&quot;2459&quot; data-ke-size=&quot;size16&quot;&gt;&amp;rarr; 항상 비교용&lt;/p&gt;
&lt;hr data-end=&quot;2472&quot; data-start=&quot;2469&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h1 data-end=&quot;2485&quot; data-start=&quot;2474&quot; data-section-id=&quot;jk77q&quot;&gt;9) 한 장 요약&lt;/h1&gt;
&lt;div&gt;
&lt;div&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;2612&quot; data-start=&quot;2487&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;2612&quot; data-start=&quot;2515&quot;&gt;
&lt;tr data-end=&quot;2533&quot; data-start=&quot;2515&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2521&quot; data-start=&quot;2515&quot;&gt;AIC&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2533&quot; data-start=&quot;2521&quot;&gt;모델 선택 기준&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;2555&quot; data-start=&quot;2534&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2539&quot; data-start=&quot;2534&quot;&gt;핵심&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2555&quot; data-start=&quot;2539&quot;&gt;적합도 + 복잡도 균형&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;2573&quot; data-start=&quot;2556&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2561&quot; data-start=&quot;2556&quot;&gt;목표&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2573&quot; data-start=&quot;2561&quot;&gt;미래 예측 성능&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;2592&quot; data-start=&quot;2574&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2579&quot; data-start=&quot;2574&quot;&gt;기준&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2592&quot; data-start=&quot;2579&quot;&gt;가장 작은 AIC&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;2612&quot; data-start=&quot;2593&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2598&quot; data-start=&quot;2593&quot;&gt;특징&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;2612&quot; data-start=&quot;2598&quot;&gt;변수 많으면 패널티&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>Ai</category>
      <category>AIC</category>
      <category>bic</category>
      <category>데이터사이언스</category>
      <category>모델링</category>
      <category>복잡도</category>
      <category>적합도</category>
      <category>최대우도</category>
      <category>통계</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/484</guid>
      <comments>https://allensdatablog.tistory.com/entry/AIC%EB%9E%80-%EB%AC%B4%EC%97%87%EC%9D%B8%EA%B0%80-%EC%A2%8B%EC%9D%80-%EB%AA%A8%EB%8D%B8%EC%9D%84-%EA%B3%A0%EB%A5%B4%EB%8A%94-%EA%B8%B0%EC%A4%80#entry484comment</comments>
      <pubDate>Tue, 7 Apr 2026 08:45:29 +0900</pubDate>
    </item>
    <item>
      <title>27. 기초 통계학 총정리 - 모든 개념을 하나로 연결하는 '통계의 큰 그림'</title>
      <link>https://allensdatablog.tistory.com/entry/26-%EA%B8%B0%EC%B4%88-%ED%86%B5%EA%B3%84%ED%95%99-%EC%B4%9D%EC%A0%95%EB%A6%AC-%EB%AA%A8%EB%93%A0-%EA%B0%9C%EB%85%90%EC%9D%84-%ED%95%98%EB%82%98%EB%A1%9C-%EC%97%B0%EA%B2%B0%ED%95%98%EB%8A%94-%ED%86%B5%EA%B3%84%EC%9D%98-%ED%81%B0-%EA%B7%B8%EB%A6%BC</link>
      <description>&lt;p data-ke-size=&quot;size16&quot;&gt;기초 통계를 한 챕터씩 따라오다 보면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;머릿속에 이런 질문이 떠오릅니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;정규분포, 추정, 검정, 회귀, DOE...&lt;br /&gt;도대체 이 모든 게 어떻게 하나로 이어지는 걸까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;개념 하나하나는 이해했지만&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;전체 구조가 어떻게 연결되는지&lt;/b&gt; 보이지 않으면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;실전에서 써먹기 어렵습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이번 글은 시리즈의 마지막으로,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 모든 개념을 &quot;하나의 흐름&quot;으로 정리해 드립니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bbK6r9/dJMcacavKHf/qDkkV5bTIhlFnNkhg0WZK0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bbK6r9/dJMcacavKHf/qDkkV5bTIhlFnNkhg0WZK0/img.png&quot; data-alt=&quot;통계&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bbK6r9/dJMcacavKHf/qDkkV5bTIhlFnNkhg0WZK0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbbK6r9%2FdJMcacavKHf%2FqDkkV5bTIhlFnNkhg0WZK0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;665&quot; height=&quot;665&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;통계&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 모든 통계의 출발점: &quot;표본 -&amp;gt; 모집단 추정&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;통계의 뼈대는 이 한 문장으로 요약됩니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;b&gt;보이지 않는 전체(모집단)를&lt;/b&gt;&lt;br /&gt;&lt;b&gt;보이는 일부(표본)를 통해 추정한다.&lt;/b&gt;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 철학을 바탕으로 우리가 배웠던 개념들이 등장합니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;표본추출&lt;/li&gt;
&lt;li&gt;평균&amp;bull;분산 같은 요약통계&lt;/li&gt;
&lt;li&gt;확률 분포&lt;/li&gt;
&lt;li&gt;정규성&lt;/li&gt;
&lt;li&gt;중심극한정리&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이건 모두 &quot;표본이 전체를 얼마나 잘 대표하는가?&quot;를 이해하기 위한 도구입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 추정과 점정: &quot;우리가 본 게 우연일까, 진짜일까?&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;데이터를 얻은 뒤 다음 질문은 항상 이것입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&quot;이 차이가 우연일까? 실제일까?&quot;&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이를 다루는 게:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;신뢰구간&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; &quot;전체는 이 범위 안에 있을 것이다.&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;가설검정&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; &quot;이 차이가 우연으로 생길 확률은 얼마나 될까?&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;1종/2종 오류 &amp;amp; 검정력&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; &quot;실수를 얼마나 할 수 있을까?&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;여기까지가 &lt;b&gt;통계적 판단의 기본 틀&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 단계에서 통계는 거의 '언어'처럼 쓰입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;p-value로 말하고&lt;/li&gt;
&lt;li&gt;신뢰구간으로 설명하고&lt;/li&gt;
&lt;li&gt;효과크기로 설득합니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 회귀분석: &quot;변수 간 관계를 모델링하는 단계&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;지금까지는 &quot;하나의 숫자(평균&amp;bull;비율)가 다르냐?&quot;를 보는 통계였다면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이제부터는 &lt;b&gt;연속적인 관계&lt;/b&gt;를 모델링합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;단순선형회귀&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 한 변수(X)가 변할 때 Y가 어떻게 변하는지&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;다중회귀&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 여러 변수가 함께 Y에 영향을 줄 때&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;로지스틱 회귀&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; Y가 Yes/No일 때&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;상관관계 vs 인과관계&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 관계는 볼 수 있지만, 원인을 단정할 수는 없음&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 단계는&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;데이터로 설명하고 예측하고 싶은 사람&quot;에게 매우 중요합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. Count 데이터처럼 더 특수한 상황: &quot;포아송&amp;bull; 음이항 회귀&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;Y가 숫자가 아니라&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;횟수(1,2,3...)&lt;/b&gt;라면?&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;선형회귀 -&amp;gt; 음수 예측이 나와서 안 됨&lt;/li&gt;
&lt;li&gt;정규성 가정 무너짐&lt;/li&gt;
&lt;li&gt;분산이 커서 포아송도 안 맞음&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 등장한 모델이&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;포아송 회귀&lt;/li&gt;
&lt;li&gt;음이항 회귀&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;현실의 제조업 데이터는 거의 항상&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;음이항&lt;/b&gt;이 기본입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 실험 설계(DOE): &quot;앞단의 통계를 실제로 써먹는 단계&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;DOE는 지금까지 배운 개념들이 현장에서 가장 직접적으로 쓰이는 단계입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;DOE는 다음 질문에 답합니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;어떤 조건이 결과에 영향을 줄까?&lt;/li&gt;
&lt;li&gt;어떤 조합이 최적일까?&lt;/li&gt;
&lt;li&gt;상호작용이 존재할까?&lt;/li&gt;
&lt;li&gt;최소 실험으로 최대한 정보를 얻으려면?&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;DOE의 핵심은&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;통계를 실제 엔지니어링에 적용하는 방법&quot;이라는 점입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;통계의 앞단&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 표본&amp;bull;추정&amp;bull;검정&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 분포 이해&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;통계의 중단&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 회귀분석&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 모델링&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;통계의 끝단(DOE)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 실험 계획&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 최적 조건 탐색&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 공정 개선&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 실제 프로젝트 예시로 전체 흐름 파악&lt;/h3&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;b&gt;상황&lt;/b&gt;&lt;br /&gt;차량 엔진 출력이 들쭉날쭉한 원인을 찾고 싶다.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;1) 데이터 구조 파악&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표본 수, 평균, 분산을 확인&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 전체 흐름 파악&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;2) 확률적 특성 이해&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;정규? 비정규?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 중심극한정리 적용 가능성 체크&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;3) 추정 &amp;amp; 검정&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;새 부품 적용 전/후 출력 차이가 유의한가?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;4) 회귀 모델링&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;연료 분사량, 점화 타이밍, 공기 유량이 출력에 어떤 영향을 주는가?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;5) Count 데이터 처리&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;출력 이상 발생 횟수가 포아송 vs 음이항 중 어디에 가까운가?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;6) DOE로 최적 조건 탐색&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;3~4개 요인으로 2수준 요인 실험&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 상호작용 확인&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 최적 조합 결정&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;단계&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 핵심 질문&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;사용되는 개념&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;표본&amp;middot;요약&lt;/td&gt;
&lt;td&gt;&amp;ldquo;데이터는 어떤 모습인가?&amp;rdquo;&lt;/td&gt;
&lt;td&gt;평균, 분산, 표본추출&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;확률&amp;middot;분포&lt;/td&gt;
&lt;td&gt;&amp;ldquo;어떤 패턴을 따르는가?&amp;rdquo;&lt;/td&gt;
&lt;td&gt;정규분포, 중심극한정리&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;추정&amp;middot;검정&lt;/td&gt;
&lt;td&gt;&amp;ldquo;차이가 의미 있는가?&amp;rdquo;&lt;/td&gt;
&lt;td&gt;p-value, 신뢰구간, 오류&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;회귀분석&lt;/td&gt;
&lt;td&gt;&amp;ldquo;무엇이 영향을 주는가?&amp;rdquo;&lt;/td&gt;
&lt;td&gt;선형&amp;middot;다중&amp;middot;로지스틱 회귀&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;Count 모델&lt;/td&gt;
&lt;td&gt;&amp;ldquo;횟수형 데이터는?&amp;rdquo;&lt;/td&gt;
&lt;td&gt;포아송&amp;middot;음이항 회귀&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;DOE&lt;/td&gt;
&lt;td&gt;&amp;ldquo;최적 조건은 무엇인가?&amp;rdquo;&lt;/td&gt;
&lt;td&gt;요인&amp;middot;수준&amp;middot;상호작용&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>DOE</category>
      <category>데이터분석</category>
      <category>분산</category>
      <category>분포</category>
      <category>정규분포</category>
      <category>통계학</category>
      <category>표본</category>
      <category>확률</category>
      <category>회귀모델</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/483</guid>
      <comments>https://allensdatablog.tistory.com/entry/26-%EA%B8%B0%EC%B4%88-%ED%86%B5%EA%B3%84%ED%95%99-%EC%B4%9D%EC%A0%95%EB%A6%AC-%EB%AA%A8%EB%93%A0-%EA%B0%9C%EB%85%90%EC%9D%84-%ED%95%98%EB%82%98%EB%A1%9C-%EC%97%B0%EA%B2%B0%ED%95%98%EB%8A%94-%ED%86%B5%EA%B3%84%EC%9D%98-%ED%81%B0-%EA%B7%B8%EB%A6%BC#entry483comment</comments>
      <pubDate>Fri, 20 Feb 2026 00:05:24 +0900</pubDate>
    </item>
    <item>
      <title>26.실험 설계(DOE) 기초 - 현장에서 실패를 줄이고, 성공을 빠르게 만드는 기술</title>
      <link>https://allensdatablog.tistory.com/entry/26%EC%8B%A4%ED%97%98-%EC%84%A4%EA%B3%84DOE-%EA%B8%B0%EC%B4%88-%ED%98%84%EC%9E%A5%EC%97%90%EC%84%9C-%EC%8B%A4%ED%8C%A8%EB%A5%BC-%EC%A4%84%EC%9D%B4%EA%B3%A0-%EC%84%B1%EA%B3%B5%EC%9D%84-%EB%B9%A0%EB%A5%B4%EA%B2%8C-%EB%A7%8C%EB%93%9C%EB%8A%94-%EA%B8%B0%EC%88%A0</link>
      <description>&lt;p data-ke-size=&quot;size16&quot;&gt;제조업(특히 자동차, 전자, 기계)에서 가장 자주 받는 말이 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;이 조건을 바꿔보면 좋아질까?&quot;&lt;br /&gt;&quot;온도를 조금 올려볼까? 압력은?&quot;&lt;br /&gt;&quot;부품 설계를 약간 변경하면 성능이 개선될까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;문제는...&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;조건은 5가지인데 조합은 수십, 수백 가지가 된다는 점입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 경험적으로 하나씩 바꿔보는 방식은&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;시간도 오래 걸리고, 실패할 확률도 높습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 문제를 해결하는 강력한 도구가 바로 &lt;b&gt;DOE(Design of Experiments)&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bYWBml/dJMcafyirWx/1nXLQ2omQpOQyAdIbw1kd0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bYWBml/dJMcafyirWx/1nXLQ2omQpOQyAdIbw1kd0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bYWBml/dJMcafyirWx/1nXLQ2omQpOQyAdIbw1kd0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbYWBml%2FdJMcafyirWx%2F1nXLQ2omQpOQyAdIbw1kd0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;572&quot; height=&quot;572&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. DOE란 무엇인가?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;한 문장으로 정의하면 이렇습니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;b&gt;&quot;적은 실험으로 최대한 많은 정보를 얻는 방법&quot;&lt;/b&gt;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;조건을 무작위로 바꾸는 것이 아니라&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;계획적으로, 체계적으로, 최소한의 횟수로&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;무엇이 결과에 영향을 주는지 알아내는 방식입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 왜 DOE가 필요한가?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;제조업에서는 실험 하나가 이렇게 생겼습니다:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;공정 조건 변경 -&amp;gt; 시간 소요&lt;/li&gt;
&lt;li&gt;테스트 장비 작동 -&amp;gt; 비용 발생&lt;/li&gt;
&lt;li&gt;샘플 수집 -&amp;gt; 품질 검사&lt;/li&gt;
&lt;li&gt;결과 측정 -&amp;gt; 재시험 필요&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 실험 하나에&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;시간, 돈, 인력&lt;/b&gt;이 매우 많이 들어갑니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 아래 같은 방식은 비효율적입니다:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;조건 하나씩만 바꾸기(One-factor-at-a-time, OFAT)&lt;/li&gt;
&lt;li&gt;감으로 조건을 선택&lt;/li&gt;
&lt;li&gt;경험에 의존하는 개발 방식&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;DOE는 다음을 가능하게 합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;최소 실험으로&amp;nbsp;&lt;br /&gt;어떤 요인이 중요하고&lt;br /&gt;어떤 조합이 최적인지&lt;br /&gt;조건 변화가 결과를 얼마나 바꾸는지&lt;br /&gt;상호작용이 존재하는지까지&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;한 번에 파악할 수 있습니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. DOE의 핵심 개념 한 번에 보기&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;DOE는 크게 3가지 핵심으로 구성됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;1) 요인(Factor)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결과에 영향을 줄 수 있는 변수입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자동차 예시:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;엔진오일 점도&lt;/li&gt;
&lt;li&gt;점화 타이밍&lt;/li&gt;
&lt;li&gt;공기 유량&lt;/li&gt;
&lt;li&gt;압축비&lt;/li&gt;
&lt;li&gt;연료 분사량&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;공정 예시:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;온도&lt;/li&gt;
&lt;li&gt;압력&lt;/li&gt;
&lt;li&gt;시간&lt;/li&gt;
&lt;li&gt;습도&lt;/li&gt;
&lt;li&gt;속도&lt;/li&gt;
&lt;li&gt;&amp;nbsp;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 &quot;조절 가능한 조건&quot;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;2) 수준(Level)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;각 요인의 설정값입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예)&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;온도(저: 150&amp;deg;C / 고: 180&amp;deg;C)&lt;/li&gt;
&lt;li&gt;압력(저: 2bar / 고: 4bar)&lt;/li&gt;
&lt;li&gt;시간(10초 / 20초)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;DOE에서는 보통&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;2 수준(저/고)을 가장 기본적으로 사용합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;3) 반응(Response)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;조건을 바꿨을 때 결과가 어떻게 변했는지 나타내는 값입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;연비&lt;/li&gt;
&lt;li&gt;출력&lt;/li&gt;
&lt;li&gt;불량률&lt;/li&gt;
&lt;li&gt;고장 시간&lt;/li&gt;
&lt;li&gt;강도&lt;/li&gt;
&lt;li&gt;표면 품질 등&lt;/li&gt;
&lt;/ul&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 가장 많이 쓰는 DOE 방법 - 2 수준 요인 실험 (2^k Factorial)&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가장 기본적이면서도 가장 강력한 DOE 방법입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;예시&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;조건 3개(온도 T, 압력 P, 시간 S)를 각 2 수준으로 실험한다면:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모든 조합 수 = 2&amp;sup3; = &lt;b&gt;8회 실험&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 8번의 실험만으로:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;온도가 결과에 얼마나 영향을 주는지&lt;/li&gt;
&lt;li&gt;압력은?&lt;/li&gt;
&lt;li&gt;시간은?&lt;/li&gt;
&lt;li&gt;온도와 압력의 조합은? (상호작용)&lt;/li&gt;
&lt;li&gt;최적 조건은 무엇인지&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모두 볼 수 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;단 8번의 실험으로요.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;OFAT 방식이었다면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;적어도 20 ~ 30번은 필요했을 겁니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 상호작용(Interaction)이 정말 중요하다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;DOE에서 가장 중요한 개념 중 하나가 바로 상호작용입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;OFAT 방식의 가장 큰 문제가 이거예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예시로 '도장 공정'을 보겠습니다:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;온도 높이면 품질 하락&lt;/li&gt;
&lt;li&gt;점도 낮추면 품질 하락&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;온도를 높이면서 점도를 낮추면 오히려 품질 상승&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;b&gt;조건&amp;nbsp; A는 단독으로 나쁘지만&lt;/b&gt;&lt;br /&gt;&lt;b&gt;B와 함께 있으면 좋아지는 경우도 많다는 것&lt;/b&gt;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이걸&amp;nbsp; OFAT 방식으로는 절대 발견할 수 없습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 DOE는 상호작용을 한 번에 탐색합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;제조업에서는 상호작용이 매우 흔합니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;온도 x 습도&lt;/li&gt;
&lt;li&gt;압력 x 속도&lt;/li&gt;
&lt;li&gt;재질 x 공정 시간&lt;/li&gt;
&lt;li&gt;전류 x 온도&lt;/li&gt;
&lt;li&gt;윤활 조건 x 부하&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;상호작용을 고려하지 않으면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;개선 설계가 오히려 품질을 악화시키는 경우도 생깁니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. DOE의 실제 활용 예 - 자동차 제조 사례&lt;/h3&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;문제&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;신형 엔진의 연비를 개선하고 싶다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;요인(Factor)&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;연료 분사량 (저/고)&lt;/li&gt;
&lt;li&gt;점화 타이밍 (늦게/빠르게)&lt;/li&gt;
&lt;li&gt;공기 유량 (저/고)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;반응(Response)&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;연비(km/L)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;DOE 실험 8회 후 결과:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;연료 분사량: 영향 작음&lt;/li&gt;
&lt;li&gt;점화 타이밍: 영향 큼&lt;/li&gt;
&lt;li&gt;공기 유량: 영향 큼&lt;/li&gt;
&lt;li&gt;(점화 타이밍 x 공기 유량): 매우 중요!&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결론:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;연비를 올리는 핵심은&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;점화 타이밍을 빠르게 + 공기 유량을 높이는 조합&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이건 OFAT 방식으로는 절대 발견할 수 없습니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 실무자 입장에서 기억해야 할 간단한 DOE&amp;nbsp; 흐름&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;1. 문제 정의&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;2. 요인 목록 만들기&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;3. 각 용인의 수준(값) 설정&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;4. 실험 매트릭스 구성(2^factorial)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;5. 실험 수행&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;6. 그래프(주효과도, 상호작용도) 분석&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;7. 중요한 요인 선별&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;8. 최적 조건 찾기&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;딱 이 8단계입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;요인&lt;/td&gt;
&lt;td&gt;결과에 영향을 줄 조건&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;수준&lt;/td&gt;
&lt;td&gt;요인의 값(저/고 등)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;반응&lt;/td&gt;
&lt;td&gt;실험 결과&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;DOE&lt;/td&gt;
&lt;td&gt;최소 실험으로 최대 정보 얻기&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;2수준 요인 실험&lt;/td&gt;
&lt;td&gt;가장 기본이면서 강력한 DOE&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;상호작용&lt;/td&gt;
&lt;td&gt;단독 영향보다 조합의 영향이 중요할 수 있음&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>Ai</category>
      <category>DOE</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>반응</category>
      <category>빅데이터</category>
      <category>수준</category>
      <category>실험설계</category>
      <category>요인</category>
      <category>통계</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/482</guid>
      <comments>https://allensdatablog.tistory.com/entry/26%EC%8B%A4%ED%97%98-%EC%84%A4%EA%B3%84DOE-%EA%B8%B0%EC%B4%88-%ED%98%84%EC%9E%A5%EC%97%90%EC%84%9C-%EC%8B%A4%ED%8C%A8%EB%A5%BC-%EC%A4%84%EC%9D%B4%EA%B3%A0-%EC%84%B1%EA%B3%B5%EC%9D%84-%EB%B9%A0%EB%A5%B4%EA%B2%8C-%EB%A7%8C%EB%93%9C%EB%8A%94-%EA%B8%B0%EC%88%A0#entry482comment</comments>
      <pubDate>Tue, 17 Feb 2026 10:26:43 +0900</pubDate>
    </item>
    <item>
      <title>25. 표본 크기와 검정력(Power)의 실무적 의미</title>
      <link>https://allensdatablog.tistory.com/entry/25-%ED%91%9C%EB%B3%B8-%ED%81%AC%EA%B8%B0%EC%99%80-%EA%B2%80%EC%A0%95%EB%A0%A5Power%EC%9D%98-%EC%8B%A4%EB%AC%B4%EC%A0%81-%EC%9D%98%EB%AF%B8</link>
      <description>&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;- &quot;데이터는 많으면 무조건 좋은 걸까?&quot;&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 내용은 정말 중요합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;특히 제조업, 자동차 분야처럼 테스트 비용이 크고, 실험 여건이 제한되는 환경에서는&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;표본 크기 결정(sample size determination)&lt;/b&gt;이 분석 능력의 절반이라고 해도 과언이 아닙니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이번 글에서는&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;표본이 많으면 좋다&quot; 같은 단순한 말이 아니라,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;왜? 얼마나? 어떤 기준으로?&lt;/b&gt;&lt;br /&gt;이 부분을 명확하게 이해할 수 있도록 직관 중심으로 설명하겠습니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/dhp7gQ/dJMcai9yiWK/YLPPbKNoSe3ehXIInbYkm1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/dhp7gQ/dJMcai9yiWK/YLPPbKNoSe3ehXIInbYkm1/img.png&quot; data-alt=&quot;표본 크기와 검정력&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/dhp7gQ/dJMcai9yiWK/YLPPbKNoSe3ehXIInbYkm1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fdhp7gQ%2FdJMcai9yiWK%2FYLPPbKNoSe3ehXIInbYkm1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;623&quot; height=&quot;623&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;표본 크기와 검정력&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 표본 크기가 왜 중요한가?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;통계에서 표본 크기는 단순히 &quot;데이터 양&quot;이 아닙니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표본 크기는 &lt;b&gt;결과의 신뢰성, 유의성, 재현성, 비용&lt;/b&gt;을 모두 결정하는 핵심 변수입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;너무 적으면 -&amp;gt; 결과가 흔들림&lt;/li&gt;
&lt;li&gt;너무 많으면 -&amp;gt; 비용 낭비 &amp;amp; &quot;쓸데없이 유의한 결과&quot; 발생&lt;/li&gt;
&lt;li&gt;적당해야 -&amp;gt; 의미 있으면서도 실용적인 판단 가능&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이걸 결정해 주는 개념이 &lt;b&gt;검정력(Power)&lt;/b&gt;입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 먼저, &quot;유의성(significance)&quot;이 무엇인지 다시 보자&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가설검정에서 흔히 말하는 p-value는 다음 질문에 답합니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;그냥 우연으로 이렇게 큰 차이가 나타날 확률은 얼마나 될까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;p &amp;lt; 0.05라면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;우리는 &quot;우연으로 보기 어렵다 -&amp;gt; 효과 있음&quot;이라고 해석하죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그런데 여기엔 큰 문제가 있습니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 표본이 너무 많으면 &quot;별 의미 없는 차이도 전부 유의&quot;해진다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차 엔진 테스트에서:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;A 모델 연비 : 15.0km/L&lt;/li&gt;
&lt;li&gt;B 모델 연비 : 15.1km/L&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;차이는 0.1km/L밖에 안 됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;운전자 입장에서는 체감도 없고, 제조 비용 대비 의미도 없음.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그런데 표본이 1만 대면 p-value는 거의 0에 가까워지고,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;통계적으로 유의한 차이!&quot;라고 나옵니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 실제로는 &lt;b&gt;아무 의미 없는 차이&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 바로 표본 크기가 너무 많으면 생기는 &lt;b&gt;유의성의 함정&lt;/b&gt;입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 반대로 표본이 너무 적으면 &quot;중요한 차이도 못 잡는다&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이번엔 반대 상황을 보죠.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;A 모델 제동거리: 평균 39.0m&lt;/li&gt;
&lt;li&gt;B 모델 제동거리: 평균 41.0m&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;차이 2m는 매우 의미 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 표본이 5대씩밖에 없다면?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;분산이 조금만 커도&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;유의하지 않음(p &amp;gt; 0.05)&quot;이 나옵니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 상황은 실무에서 매우 빈번합니다:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;테스트 비용이 커서 데이터를 많이 못 모을 때&lt;/li&gt;
&lt;li&gt;QA 샘플링이 제한될 때&lt;/li&gt;
&lt;li&gt;고가 장비 테스트(진동시험, 엔진 다이나모 등)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결국 중요한 차이를 놓치게 됩니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 그래서 등장하는 개념: 검정력(Power)&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;Power는 이렇게 정의됩니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;b&gt;&quot;진짜 효과가 있을 때, 그걸 제대로 찾아낼 확률&quot;&lt;/b&gt;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;놓쳐서는 안 되는 것을 놓치지 않을 확률입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;공식으로는:&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;Power = 1 - 2종오류(&amp;beta;)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1종 오류 (&amp;alpha;) &lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 효과가 없는 데 있다고 판정&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt;&quot;잘못된 경보&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt; ✔ 2종 오류 (&amp;beta;) &lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 효과가 있는데 없다고 판정&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; &quot;놓쳐버리는 실수&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;Power는 그 중 &lt;b&gt;&amp;beta;를 줄이는 것,&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉 &quot;놓치지 않는 능력&quot;입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 검정력을 결정하는 4가지 요소&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;검정력은 4가지 요소가 균형을 이뤄야 합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;요소&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;1) 표본 크기 n&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;많을수록 검정력 &amp;uarr;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;2) 효과 크기(effect size)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;차이가 클수록 검정력 &amp;uarr;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;3) 데이터의 변동성(&amp;sigma;)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;변동성이 적을수록 &amp;uarr;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;4) 유의수준 &amp;alpha;&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;느슨하게(0.05&amp;rarr;0.10) 하면 &amp;uarr;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 중 &lt;b&gt;표본 크기가 가장 쉽게 조절 가능한 요소&lt;/b&gt;입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 실제 제조업 예시로 이해해 보자&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;상황&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;새로운 엔진 오일이 연비를 개선하는지 확인하고 싶다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;A. 효과 크기&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;기존 연비: 15.0&lt;/li&gt;
&lt;li&gt;개선 목표: +1.0km/L&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; -&amp;gt; 효과 크기 = 1.0&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;B. 변동성&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;엔진 테스트마다 연비는 0.8 ~ 1.2 정도 흔들림&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; &amp;sigma; &amp;asymp; 1.0&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;C. 원하는 Power&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;보통 Power는 0.8(= 80%) 이상 권장&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 상황에서 필요한 표본 크기를 계산하면:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;대략 16~20대&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그런데 5대만 테스트하면?&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;변동성 때문에 차이가 안 보일 확률이 높음&lt;/li&gt;
&lt;li&gt;중요한 개선을 놓칠 위험 증가&lt;/li&gt;
&lt;li&gt;개발팀은 &quot;효과 없음&quot;이라고 판단&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 일이 실제로 매우 자주 발생합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. Power 분석이 실무에서 중요한 이유&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;테스트 비용 절감&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자동차 엔진 테스트 한 번에 수백만~수천만 원이 들어가죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;Power 분석이 없으면 &quot;필요 이상의 테스트&quot;를 하게 됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;실험 실패 방지&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표본 수가 부족하면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;중요한 개선점을 놓치고 제품 결함을 그대로 두게 됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;불량률, 고장률 검증에 필수&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;특히 다음 같은 판단에서는 Power가 절대 필요합니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;공정 개선 전/후 불량률 비교&lt;/li&gt;
&lt;li&gt;신모델 vs 구모델 고장률 비교&lt;/li&gt;
&lt;li&gt;공급업체 품질 차이 분석&lt;/li&gt;
&lt;li&gt;안전시험 통과 여부 판단&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;데이터 기반 의사결정의 신뢰성 확보&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표본 수만 잘못 잡아도&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모든 결과가 뒤틀립니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;9. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;핵심&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;표본 크기&lt;/td&gt;
&lt;td&gt;많으면 유의성 과장, 적으면 중요한 차이 놓침&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;검정력 Power&lt;/td&gt;
&lt;td&gt;진짜 차이를 놓치지 않는 능력&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;중요 요소&lt;/td&gt;
&lt;td&gt;n, 효과크기, &amp;sigma;, &amp;alpha;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;실무 포인트&lt;/td&gt;
&lt;td&gt;테스트 비용 vs 검정력 &amp;rarr; 적정 표본 수 결정&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;표본 크기와 검정력은 단순한 통계 개념이 아니라&lt;br /&gt;&lt;/span&gt;실험 설계와 품질 검증의 중심입니다.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>1종</category>
      <category>2종</category>
      <category>Power</category>
      <category>검정력</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>유의성</category>
      <category>통계</category>
      <category>표본크기</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/481</guid>
      <comments>https://allensdatablog.tistory.com/entry/25-%ED%91%9C%EB%B3%B8-%ED%81%AC%EA%B8%B0%EC%99%80-%EA%B2%80%EC%A0%95%EB%A0%A5Power%EC%9D%98-%EC%8B%A4%EB%AC%B4%EC%A0%81-%EC%9D%98%EB%AF%B8#entry481comment</comments>
      <pubDate>Sat, 14 Feb 2026 09:25:30 +0900</pubDate>
    </item>
    <item>
      <title>24. 포아송 회귀 vs 음이항 회귀</title>
      <link>https://allensdatablog.tistory.com/entry/24-%ED%8F%AC%EC%95%84%EC%86%A1-%ED%9A%8C%EA%B7%80-vs-%EC%9D%8C%EC%9D%B4%ED%95%AD-%ED%9A%8C%EA%B7%80</link>
      <description>&lt;h3 data-ke-size=&quot;size23&quot;&gt;고장 횟수 데이터는 왜 일반 회귀로 처리하면 안 될까?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;제조업, 자동차 업계 데이터를 분석하다 보면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&quot;횟수(Count)&quot; 형태의 데이터&lt;/b&gt;가 정말 자주 등장합니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;차량 A의 월별 고장 횟수&lt;/li&gt;
&lt;li&gt;공장 라인의 시간당 불량 건수&lt;/li&gt;
&lt;li&gt;특정 오류 코드 발생 횟수&lt;/li&gt;
&lt;li&gt;하루 동안 클레임(항의) 발생 수&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 값들은 0,1,2,3, ... 처럼 &quot;정수이고,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;음수는 절대 없고,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;대부분 &lt;b&gt;0에 가깝고, 가끔 크게 튀는 값들이 있는 형태&lt;/b&gt;를 보이죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;여기서 중요한 질문이 하나 생깁니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;이런 데이터를 왜 선형회귀로 예측하면 안 될까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이유는 간단합니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;선형회귀는 예측값이&lt;b&gt; 음수가 될 수 있음&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;정규분포 기반이라 &lt;b&gt;분산이 일정하다고 가정함&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;count 데이터는 본질적으로 &lt;b&gt;분포가 완전히 다름&lt;/b&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 등장하는 모델이&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;포아송 회귀(Posson Regression)&lt;/b&gt;와&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 한계를 해결한 &lt;b&gt;음이항 회귀(Negative Binominal Regression)&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/tEGqJ/dJMcabCCxHb/VJIidL0zlRkfkzv6oqlRj1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/tEGqJ/dJMcabCCxHb/VJIidL0zlRkfkzv6oqlRj1/img.png&quot; data-alt=&quot;포아송-음이항&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/tEGqJ/dJMcabCCxHb/VJIidL0zlRkfkzv6oqlRj1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FtEGqJ%2FdJMcabCCxHb%2FVJIidL0zlRkfkzv6oqlRj1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;682&quot; height=&quot;682&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;포아송-음이항&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 포아송 분포(Possion Distribution) - &quot;희귀한 사건의 횟수&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;포아송 분포는 한 문장으로 정리하면&amp;nbsp; 이렇습니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;b&gt;&quot;단위 시간/공간에서 어떤 사건이 몇 번 발생하는 가?&quot;&lt;/b&gt;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;제조업 예시로는:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;하루 동안 불량이 몇 개 발생했는가&lt;/li&gt;
&lt;li&gt;한 달 동안 특정 엔진에서 고장이 몇 번 났는가&lt;/li&gt;
&lt;li&gt;1,000대당 클레임이 몇 건 발생했는가&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 데이터가 전형적인 &lt;b&gt;포아송 데이터&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;포아송 분포의 핵심 가정이 하나 있습니다:&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;평균 = 분산&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 평균 고장 횟수가 2회라면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;고장 횟수의 분산도 2여야 한다는 뜻.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;여기서 문제가 발생합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 제조업, 자동차 데이터는 &quot;과대산포(Overdispersion)&quot;가 거의 항상 존재한다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;현실 데이터에서는 대부분&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;분산이 평균보다 훨씬 크다&lt;/b&gt;는 문제가 생깁니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이걸 &lt;b&gt;과대산포(Over-dispersion)&lt;/b&gt;라고 불러요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예시로 볼까요?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;예: A공장의 일일 불량 데이터&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;평균(&amp;lambda;) = 2&lt;/li&gt;
&lt;li&gt;분산 = 15&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;분산이 평균보다&lt;b&gt; 7~8배 이상 커짐&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 포아송 가정과 완전히 다름&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;왜 이런 일이 생길까요?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;특정 날은 설비 이상으로 불량이 몰림&lt;/li&gt;
&lt;li&gt;공정 자체가 일정하지 않음&lt;/li&gt;
&lt;li&gt;환경 조건(온도, 습도)이 크게 흔들림&lt;/li&gt;
&lt;li&gt;제품 종류가 매일 조금씩 다름&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, &lt;b&gt;현실의 제조 데이터는 균일하지 않다&lt;/b&gt;는 뜻입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;포아송 분포는 이런 &quot;불균일성&quot;을 설명하지 못합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 그래서 등장한 모델 - &quot;음이항 회귀&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;음이항(Negative Binominal) 회귀는&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;포아송의 핵심 가정을 완화한 모델입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;핵심 차이는 딱 하나:&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;b&gt;포아송: 평균 = 분산&lt;/b&gt;&lt;br /&gt;&lt;b&gt;음이항: 분산 &amp;gt;= 평균&lt;/b&gt; (항상 더 큼)&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;음이항 모델은 분산을 다음처럼 표현합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt; &lt;span&gt;&lt;span&gt;Va&lt;/span&gt;&lt;span&gt;r&lt;/span&gt;&lt;span&gt;(&lt;/span&gt;&lt;span&gt;Y&lt;/span&gt;&lt;span&gt;) &lt;/span&gt;&lt;span&gt;= &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&amp;mu; &lt;/span&gt;&lt;span&gt;+ &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&amp;alpha;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&amp;mu;&amp;sup2;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt; &lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;alpha;(알파)가 0이면 포아송과 동일하지만,&lt;br /&gt;&amp;alpha;가 커질수록 &lt;b&gt;분산이 훨씬 커지는 데이터&lt;/b&gt;를 설명합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 제조업처럼 &quot;일부 날에 불량 폭발처럼 튀는 패턴&quot;을 잘 설명합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 포아송 vs 음이항 - 실제 데이터로 비교&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 30일 동안 부품 불량 건수가 다음과 같습니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;대부분 0~2개&lt;/li&gt;
&lt;li&gt;가끔 5~10개&lt;/li&gt;
&lt;li&gt;특정 날 20개 발생&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 데이터에 포아송 회귀를 사용하면:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;평균 2로 수렴&lt;/li&gt;
&lt;li&gt;20 같은 값을 절대 설명 못함&lt;/li&gt;
&lt;li&gt;모델이 왜곡됨&lt;/li&gt;
&lt;li&gt;p-value 엉터리&lt;/li&gt;
&lt;li&gt;예측력 심각하게 떨어짐&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;반대로 음이항 회귀는:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&quot;불량이 몰리는 날이 있다&quot;는 특성까지 반영&lt;/li&gt;
&lt;li&gt;평균과 분산 차이를 자연스럽게 해석&lt;/li&gt;
&lt;li&gt;계수(p-value)가 안정적&lt;/li&gt;
&lt;li&gt;예측력도 개선&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 통계에서는 이렇게 말합니다:&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;b&gt;&quot;현실의 count 데이터는 음이항이 기본이고,&lt;/b&gt;&lt;br /&gt;&lt;b&gt;포아송은 특별한 경우만 사용한다.&quot;&lt;/b&gt;&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 제조업, 자동차에서 대표적으로 음이항 모델이 필요한 상황&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;고장 횟수가 차량마다 들쭉날쭉&lt;/li&gt;
&lt;li&gt;모델별, 공장별로 품질 편차가 큼&lt;/li&gt;
&lt;li&gt;특정 기간에 불량이 몰리는 경우&lt;/li&gt;
&lt;li&gt;공정 환경 변화로 분포가 크게 흔들릴 때&lt;/li&gt;
&lt;li&gt;&quot;0이 너무 많은&quot; 데이터&lt;/li&gt;
&lt;li&gt;장비별 편차가 심할 때&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이건 포아송이 &lt;b&gt;전혀 설명할 수 없는 특성들&lt;/b&gt;입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 어떻게 판단할까? (실제 분석에서 필요한 기준)&lt;/h3&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;1) 분산이 평균보다 크면 -&amp;gt; 음이항&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;협소하게 보면&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;Mean = 2&lt;/li&gt;
&lt;li&gt;Variance = 2 -&amp;gt; 포아송 가능&lt;/li&gt;
&lt;li&gt;Variance = 6 -&amp;gt; 음이항 거의 확실&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;2) 포아송 회귀 돌려보고 &quot;잔차 분산이 너무 크면&quot; -&amp;gt; 음이항&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;3) AIC 비교&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;음이항이 더 낮으면 (대부분) 음이항 채택&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;항목&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 포아송 회귀&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;음이항 회귀&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;가정&lt;/td&gt;
&lt;td&gt;평균=분산&lt;/td&gt;
&lt;td&gt;분산 &amp;ge; 평균&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;분산이 큰 데이터&lt;/td&gt;
&lt;td&gt;처리 ❌&lt;/td&gt;
&lt;td&gt;처리 ⭕&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;현실성&lt;/td&gt;
&lt;td&gt;낮음&lt;/td&gt;
&lt;td&gt;매우 높음&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;제조/자동차 적합성&lt;/td&gt;
&lt;td&gt;드묾&lt;/td&gt;
&lt;td&gt;거의 항상 적합&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;과대산포 해결&lt;/td&gt;
&lt;td&gt;불가능&lt;/td&gt;
&lt;td&gt;가능&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;실무 요약 : Count 데이터는 일단 음이항을 먼저 고민하고,&lt;br /&gt;&lt;/span&gt;아주 균일한 경우에만 포아송을 사용한다.&lt;/blockquote&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>고장</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>분산</category>
      <category>분포</category>
      <category>음이항</category>
      <category>통계</category>
      <category>평균</category>
      <category>포아송</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/480</guid>
      <comments>https://allensdatablog.tistory.com/entry/24-%ED%8F%AC%EC%95%84%EC%86%A1-%ED%9A%8C%EA%B7%80-vs-%EC%9D%8C%EC%9D%B4%ED%95%AD-%ED%9A%8C%EA%B7%80#entry480comment</comments>
      <pubDate>Thu, 12 Feb 2026 10:14:30 +0900</pubDate>
    </item>
    <item>
      <title>23. 분류 모델 평가 지표 - Accuracy만 보면 큰일 나는 이유</title>
      <link>https://allensdatablog.tistory.com/entry/23-%EB%B6%84%EB%A5%98-%EB%AA%A8%EB%8D%B8-%ED%8F%89%EA%B0%80-%EC%A7%80%ED%91%9C-Accuracy%EB%A7%8C-%EB%B3%B4%EB%A9%B4-%ED%81%B0%EC%9D%BC-%EB%82%98%EB%8A%94-%EC%9D%B4%EC%9C%A0</link>
      <description>&lt;p data-ke-size=&quot;size16&quot;&gt;분류 모델을 처음 만들면 대부분 이렇게 말합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;정확도(Accuracy)가 95%라니, 모델 잘 나오네!&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 제조업/자동차, 의료 같은 분야에서는&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;Accuracy만 믿으면 큰 사고가 납니다.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;왜냐하면...&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;불량률이 1%만 되어도&lt;/li&gt;
&lt;li&gt;Accuracy는 아무것도 안 해도 99%가 나오거든요.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 공장에서 1000개 중 10개만 불량이라면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모델이 &quot;모두 정상&quot;이라고만 말해도 Accuracy는 99%입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이건 좋은 모델이 아니라&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;사실상 아무것도 못 맞춘 모델&lt;/b&gt;이죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 필요한 것이 Precision, Recall, F1, AUC 같은 지표들입니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1536&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bnOgyO/dJMcajm29bW/O2IAGQprbfW80x2IPh5KA0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bnOgyO/dJMcajm29bW/O2IAGQprbfW80x2IPh5KA0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bnOgyO/dJMcajm29bW/O2IAGQprbfW80x2IPh5KA0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbnOgyO%2FdJMcajm29bW%2FO2IAGQprbfW80x2IPh5KA0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;675&quot; height=&quot;450&quot; data-origin-width=&quot;1536&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. Accracy - 전체 중 맞춘 비율 (가장 단순, 그래서 위험)&lt;/h3&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;211&quot; data-origin-height=&quot;66&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/b67wnf/dJMcah3TlpL/zfiCczsw3xHK7yWCOpgesK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/b67wnf/dJMcah3TlpL/zfiCczsw3xHK7yWCOpgesK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/b67wnf/dJMcah3TlpL/zfiCczsw3xHK7yWCOpgesK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fb67wnf%2FdJMcah3TlpL%2FzfiCczsw3xHK7yWCOpgesK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;211&quot; height=&quot;66&quot; data-origin-width=&quot;211&quot; data-origin-height=&quot;66&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;TP : 진짜 불량을 맞춘 경우&lt;/li&gt;
&lt;li&gt;TN : 진짜 정상을 맞춘 경우&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;문제는..&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;불량이 희귀하면 Accuracy는 늘 높게 나옵니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;문제 예시&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;공장에서 하루 1만 개 중 10개가 불량이면,&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;모델이 &quot;전부 정상&quot;이라고 해도 Accuracy는 99.9%&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 이 모델은 &lt;b&gt;불량을 1개도 못 잡음.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 Accuracy는 분류 문제의 본질을 반영하지 못합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. Precision - &quot;잡았다!&quot; 중에 진짜 불량이 얼마나 되는가&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;Precision은 이런 질문에 답합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;불량이라고 판정한 것 중에서,&lt;br /&gt;실제로 불량인 건 얼마나 될까?&quot;&lt;/blockquote&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;211&quot; data-origin-height=&quot;67&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/E0Rep/dJMcacVOEaw/lHSWqIww6OOBe5MRfb9X61/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/E0Rep/dJMcacVOEaw/lHSWqIww6OOBe5MRfb9X61/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/E0Rep/dJMcacVOEaw/lHSWqIww6OOBe5MRfb9X61/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FE0Rep%2FdJMcacVOEaw%2FlHSWqIww6OOBe5MRfb9X61%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;211&quot; height=&quot;67&quot; data-origin-width=&quot;211&quot; data-origin-height=&quot;67&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;FP(False Positive) = 정상인데 불량이라고 잘못 찍은 것&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;제조업 예시&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;불량으로 분류한 50개 중에서&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;진짜 불량이 40개면 Precision은 80%.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;경보를 울릴 때 얼마나 정확한가?&quot;&lt;/b&gt;를 측정합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. Recall - &quot;진짜 불량&quot;을 얼마나 놓치지 않았는가&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;Recall은 다음 질문에 답합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;전체 불량 중에서,&lt;br /&gt;모델이 얼마나 많이 잡아냈는가?&quot;&lt;/blockquote&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;182&quot; data-origin-height=&quot;71&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/cc4a4u/dJMcacars2j/fFcnSR11HSvd73fMGKvxk1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/cc4a4u/dJMcacars2j/fFcnSR11HSvd73fMGKvxk1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/cc4a4u/dJMcacars2j/fFcnSR11HSvd73fMGKvxk1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fcc4a4u%2FdJMcacars2j%2FfFcnSR11HSvd73fMGKvxk1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;182&quot; height=&quot;71&quot; data-origin-width=&quot;182&quot; data-origin-height=&quot;71&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;FN(False Negative) = 불량인데 정상으로 판정한 경우&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;제조업 예시&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;전체 불량 100개 중&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;70개만 잡았다면 Recall 70%.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;불량을 놓치지 않는 능력입&lt;/b&gt;니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. Precision vs Recall - 둘 다 높이기 어려운 이유&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 두 지표는 &quot;Trade Off 관계&quot;입니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;Precision을 높이면 -&amp;gt; Recall이 떨어지고&lt;/li&gt;
&lt;li&gt;Recall을 높이면 -&amp;gt; Precision이 떨어집니다&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;비유 : 공장 불량 검사기&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;아주 까다롭게 검사하면 -&amp;gt; 오탐(False Positive)이 늘고 Precision 낮아짐&lt;/li&gt;
&lt;li&gt;아주 느슨하게 검사하면 -&amp;gt; 불량을 놓치기 쉬워 Recall이 낮아짐&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 둘 사이 균형을 맞춰야 합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. F1-score -- Precision과 Recall을 한 번에 본다&lt;/h3&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;265&quot; data-origin-height=&quot;64&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/KriEt/dJMcadf4p0B/MmGMgnlWnM3GiqTJckKjV0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/KriEt/dJMcadf4p0B/MmGMgnlWnM3GiqTJckKjV0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/KriEt/dJMcadf4p0B/MmGMgnlWnM3GiqTJckKjV0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FKriEt%2FdJMcadf4p0B%2FMmGMgnlWnM3GiqTJckKjV0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;265&quot; height=&quot;64&quot; data-origin-width=&quot;265&quot; data-origin-height=&quot;64&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;F1은 Precision과 Recall의 &lt;b&gt;조화평균&lt;/b&gt;입니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;둘 중 하나라도 낮으면 F1이 확 떨어짐&lt;/li&gt;
&lt;li&gt;둘이 적당히 균형을 이루는 모델이 좋은 모델&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 제조업 불량 검출처럼&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;놓치면 절대 안 되는&quot; 문제에서는 F1이 매우 중요합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. ROC Curve &amp;amp; AUC - 임계값을 고려한 가장 직관적 지표&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;로지스틱 회귀는 &quot;확률(p)&quot;을 예측하므로&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;여기서 0.5로 분류할지, 0.4로 할지, 0.7로 할지에 따라 결과가 달라집니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;800&quot; data-origin-height=&quot;545&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/kGOk8/dJMcajtOOyY/rFj6Ajp5STnmrbkVlKvDv0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/kGOk8/dJMcajtOOyY/rFj6Ajp5STnmrbkVlKvDv0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/kGOk8/dJMcajtOOyY/rFj6Ajp5STnmrbkVlKvDv0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FkGOk8%2FdJMcajtOOyY%2FrFj6Ajp5STnmrbkVlKvDv0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;585&quot; height=&quot;399&quot; data-origin-width=&quot;800&quot; data-origin-height=&quot;545&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;ROC 곡선은&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모든 임계값을 변경해 가며&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모델의 전체적인 성능을 보여줍니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;가로축 : False Positive Rate&lt;/li&gt;
&lt;li&gt;세로축 : True Positive Rate ( = Recall)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;AUC는 ROC 곡선 아래 면적&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 0.5 : 무조건 랜덤&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 0.8 이상 : 준수&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 0.9 이상 : 매우 강력&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;AUC는 &quot;임계값에 상관없이 전체적인 모델력이 어떤지&quot;를 알려주는 지표.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 자동차 ● 제조업 예시로 전체 정리&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자동차 부품 고장 예측 모델을 만든다고 생각해 봅시다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;지표&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 제조업에서의 해석&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;Accuracy&lt;/td&gt;
&lt;td&gt;전체 중 맞춘 비율&lt;/td&gt;
&lt;td&gt;불량이 희귀하면 거의 무의미&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;Precision&lt;/td&gt;
&lt;td&gt;&amp;ldquo;잡았다&amp;rdquo; 중 진짜 불량 비율&lt;/td&gt;
&lt;td&gt;정상 제품을 괜히 버리는 비율&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;Recall&lt;/td&gt;
&lt;td&gt;전체 불량 중 잘 잡은 비율&lt;/td&gt;
&lt;td&gt;놓치는 불량의 수 &amp;rarr; 가장 중요&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;F1&lt;/td&gt;
&lt;td&gt;Precision&amp;middot;Recall 균형&lt;/td&gt;
&lt;td&gt;불량 검출 모델 핵심&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;AUC&lt;/td&gt;
&lt;td&gt;전체적 모델 성능&lt;/td&gt;
&lt;td&gt;임계값 변화에 영향 없음&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결국 제조업, 의료처럼 &lt;b&gt;놓치면 큰 문제가 되는 분야&lt;/b&gt;에서는&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;Recall&lt;/li&gt;
&lt;li&gt;F1&lt;/li&gt;
&lt;li&gt;AUC&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 세 가지가 가장 중요합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;지표&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 핵심 질문&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;Accuracy&lt;/td&gt;
&lt;td&gt;&amp;ldquo;전체적으로 얼만큼 맞췄나?&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;Precision&lt;/td&gt;
&lt;td&gt;&amp;ldquo;불량이라고 한 것 중 진짜 불량은?&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;Recall&lt;/td&gt;
&lt;td&gt;&amp;ldquo;진짜 불량을 얼마나 놓치지 않았나?&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;F1&lt;/td&gt;
&lt;td&gt;&amp;ldquo;Precision + Recall 균형은?&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;AUC&lt;/td&gt;
&lt;td&gt;&amp;ldquo;전체적으로 얼마나 잘 분리해내는가?&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;분류 문제의 본질은 &quot;맞춘 개수&quot;가 아니라 &quot;놓치면 안 되는 걸 잡아내는 능력&quot;입니다.&lt;br /&gt;&lt;/span&gt;특히 제조업이나 자동차같이 안전, 품질에 직결되는 분야라면,&lt;br /&gt;Recall과 F1, AUC는 선택이 아니라 기본입니다.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>accuracy</category>
      <category>AUC</category>
      <category>F1</category>
      <category>Precision</category>
      <category>recall</category>
      <category>roc</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>분류모델</category>
      <category>통계</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/479</guid>
      <comments>https://allensdatablog.tistory.com/entry/23-%EB%B6%84%EB%A5%98-%EB%AA%A8%EB%8D%B8-%ED%8F%89%EA%B0%80-%EC%A7%80%ED%91%9C-Accuracy%EB%A7%8C-%EB%B3%B4%EB%A9%B4-%ED%81%B0%EC%9D%BC-%EB%82%98%EB%8A%94-%EC%9D%B4%EC%9C%A0#entry479comment</comments>
      <pubDate>Mon, 9 Feb 2026 12:00:50 +0900</pubDate>
    </item>
    <item>
      <title>22. 로지스틱 회귀 해석 - 오즈, 로그오즈, 오즈비를 한 번에 이해하기</title>
      <link>https://allensdatablog.tistory.com/entry/22-%EB%A1%9C%EC%A7%80%EC%8A%A4%ED%8B%B1-%ED%9A%8C%EA%B7%80-%ED%95%B4%EC%84%9D-%EC%98%A4%EC%A6%88-%EB%A1%9C%EA%B7%B8%EC%98%A4%EC%A6%88-%EC%98%A4%EC%A6%88%EB%B9%84%EB%A5%BC-%ED%95%9C-%EB%B2%88%EC%97%90-%EC%9D%B4%ED%95%B4%ED%95%98%EA%B8%B0</link>
      <description>&lt;p data-ke-size=&quot;size16&quot;&gt;로지스틱 회귀를 처음 배우면 가장 헷갈리는 부분이 바로&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;오즈(Odds), 로그오즈(Log-odds), 오즈비&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 세 단어가 갑자기 등장하면서&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;아니... 왜 확률 하나 예측하는데 이렇게 복잡하지?&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;라는 생각이 들 수 있어요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 이걸 한 번 제대로 이해하면&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;제조업의 &lt;b&gt;불량 검출,&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;자동차 &lt;b&gt;고장 확률 예측,&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;금융 부도 &lt;b&gt;예측,&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;병원 &lt;b&gt;질병 여부 예측&lt;/b&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 모든 '0/1 분류 문제'를 직관적으로 해석할 수 있게 됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이번 글에서는 수식은 최소한으로 두고,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;확률이 아니라 '가능성의 비율'을 본다는 게 무엇인지&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;확실하게 이해할 수 있도록 차근차근 풀어보겠습니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bJSsdf/dJMcadNTD2a/yyh5luHkNAHS1oybJNPaYK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bJSsdf/dJMcadNTD2a/yyh5luHkNAHS1oybJNPaYK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bJSsdf/dJMcadNTD2a/yyh5luHkNAHS1oybJNPaYK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbJSsdf%2FdJMcadNTD2a%2Fyyh5luHkNAHS1oybJNPaYK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;593&quot; height=&quot;593&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 확률(p)만 가지고는 분류를 설명하기가 어렵다?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;로지스틱 회귀는 결국 &quot;1이 될 확률(p)&quot;을 예측합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차 제조업에서&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;센서 온도를 보고 &lt;b&gt;부품이 고장날 확률&lt;/b&gt;을 예측한다고 해볼게요.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;센서 온도 낮음 -&amp;gt; p = 0.02&lt;/li&gt;
&lt;li&gt;센서 온도 높음 -&amp;gt; p = 0.20&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;두 값만 보면 그냥&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;20%가 더 높네&quot; 정도밖에 설명이 안 됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그런데 여기서 중요한 질문이 생깁니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;이 부품은 고장날 가능성이 얼마나 더 큰가?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;확률로는 이 질문을 정확히 표현하기 어렵습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;왜냐면 확률은 0~1 사이에 갇혀 있고,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;비율을 만드는 순간 왜곡이 생기기 때문이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 등장한 개념이 오즈(Odds)입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 오즈(Odds) - '1일 가능성' vs '0일 가능성'의 비율&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;오즈는 아주 간단합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;124&quot; data-origin-height=&quot;75&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/boUDES/dJMcadG8vFs/04yzcq42UHDCaFIQNyT07K/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/boUDES/dJMcadG8vFs/04yzcq42UHDCaFIQNyT07K/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/boUDES/dJMcadG8vFs/04yzcq42UHDCaFIQNyT07K/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FboUDES%2FdJMcadG8vFs%2F04yzcq42UHDCaFIQNyT07K%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;124&quot; height=&quot;75&quot; data-origin-width=&quot;124&quot; data-origin-height=&quot;75&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&quot;1이 될 확률&quot;을 &quot;0이 될 확률&quot;로 나눈 값입니다.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예시로 볼게요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt; ● p = 0.2 (20% 고장 날 확률)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;161&quot; data-origin-height=&quot;62&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/utjBM/dJMcagw8yVl/AcXlrZTtWMFy9kz3lnH5aK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/utjBM/dJMcagw8yVl/AcXlrZTtWMFy9kz3lnH5aK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/utjBM/dJMcagw8yVl/AcXlrZTtWMFy9kz3lnH5aK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FutjBM%2FdJMcagw8yVl%2FAcXlrZTtWMFy9kz3lnH5aK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;161&quot; height=&quot;62&quot; data-origin-width=&quot;161&quot; data-origin-height=&quot;62&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이건&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&quot;고장 1번 날 동안 정상 4번 난다(1:4)&quot;&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;라는 의미입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt; ● p = 0.5&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;135&quot; data-origin-height=&quot;63&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/b8ZCXY/dJMcac9iBNu/CG90WJTbPekaasuN3dpno0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/b8ZCXY/dJMcac9iBNu/CG90WJTbPekaasuN3dpno0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/b8ZCXY/dJMcac9iBNu/CG90WJTbPekaasuN3dpno0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fb8ZCXY%2FdJMcac9iBNu%2FCG90WJTbPekaasuN3dpno0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;135&quot; height=&quot;63&quot; data-origin-width=&quot;135&quot; data-origin-height=&quot;63&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;고장과 정상의 가능성이 동일하다 (1:1)&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;라는 뜻이죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;● p = 0.8&lt;/b&gt;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;141&quot; data-origin-height=&quot;60&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/0bpD0/dJMcad1qRSs/TpuqfovQ1tn7a67QrKkvT0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/0bpD0/dJMcad1qRSs/TpuqfovQ1tn7a67QrKkvT0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/0bpD0/dJMcad1qRSs/TpuqfovQ1tn7a67QrKkvT0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2F0bpD0%2FdJMcad1qRSs%2FTpuqfovQ1tn7a67QrKkvT0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;141&quot; height=&quot;60&quot; data-origin-width=&quot;141&quot; data-origin-height=&quot;60&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;고장이 정상보다 4배 더 가능성이 높다&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;라는 뜻입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이제 보이죠?&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;확률은 0~1&lt;/li&gt;
&lt;li&gt;오즈는 0~ &amp;infin; (비율)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;오즈는 '몇 배 더 가능성 높은가'를 표현하기 딱 좋은 단위&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 로지스틱 회귀에서는 확률 대신&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;오즈의 세계에서 작업합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 로그오즈(Log-odds) - 오즈를 '직선으로' 만들기 위한 장치&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;문제는... 오즈는 곱셈의 세계라는 점입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그러면 회귀분석에서 직선(&amp;beta;₀ + &amp;beta;₁x)으로 표현하기가 어렵습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 오즈에 &lt;b&gt;로그(log)&lt;/b&gt;를 씌웁니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;95&quot; data-origin-height=&quot;64&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bbdkls/dJMcabbwRaL/ELFgGobXlfMHMGwXhRHGXk/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bbdkls/dJMcabbwRaL/ELFgGobXlfMHMGwXhRHGXk/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bbdkls/dJMcabbwRaL/ELFgGobXlfMHMGwXhRHGXk/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fbbdkls%2FdJMcabbwRaL%2FELFgGobXlfMHMGwXhRHGXk%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;95&quot; height=&quot;64&quot; data-origin-width=&quot;95&quot; data-origin-height=&quot;64&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이걸 로그오즈 또는 로짓(Logi)이라고 부릅니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;로그를 쓰면:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;곱셈 -&amp;gt; 덧셈&lt;/li&gt;
&lt;li&gt;비율 -&amp;gt; 직선&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;오즈의 세계를 &quot;직선 모델&quot;로 끌어올 수 있게 되는 것&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 로지스틱 회귀식은 이렇게 생겼습니다:&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;198&quot; data-origin-height=&quot;67&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/Lp3Je/dJMcaacCuYd/7YgebKOJCVlgfFw8Q3C1P0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/Lp3Je/dJMcaacCuYd/7YgebKOJCVlgfFw8Q3C1P0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/Lp3Je/dJMcaacCuYd/7YgebKOJCVlgfFw8Q3C1P0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FLp3Je%2FdJMcaacCuYd%2F7YgebKOJCVlgfFw8Q3C1P0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;198&quot; height=&quot;67&quot; data-origin-width=&quot;198&quot; data-origin-height=&quot;67&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 오즈비(Odds Ratio) - 로지스틱 회귀 해석의 핵심&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;로지스틱 회귀에서 가장 중요한 것은 바로 오즈비입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;124&quot; data-origin-height=&quot;42&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/ckJx8C/dJMcafLLyyW/KoGVq9k9spJE8gH3UDhn91/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/ckJx8C/dJMcafLLyyW/KoGVq9k9spJE8gH3UDhn91/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/ckJx8C/dJMcafLLyyW/KoGVq9k9spJE8gH3UDhn91/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FckJx8C%2FdJMcafLLyyW%2FKoGVq9k9spJE8gH3UDhn91%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;124&quot; height=&quot;42&quot; data-origin-width=&quot;124&quot; data-origin-height=&quot;42&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 한 줄만 알면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;로지스틱 회귀를 해석할 때 90%는 다 이해했다고 볼 수 있어요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어&lt;/p&gt;
&lt;p style=&quot;text-align: center;&quot; data-ke-size=&quot;size18&quot;&gt;&lt;b&gt; &lt;span&gt;&lt;span&gt;&lt;span&gt;&amp;beta;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;1&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;=&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;0.7&lt;/span&gt;&lt;/span&gt; &lt;/b&gt;&lt;/p&gt;
&lt;p style=&quot;text-align: center;&quot; data-ke-size=&quot;size18&quot;&gt;&lt;b&gt; &lt;span&gt;&lt;span&gt;&lt;span&gt;e^&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;0.7&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&amp;asymp;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;2.01&lt;/span&gt;&lt;/span&gt; &lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;즉,&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;X가 1 증가하면 &quot;1이 될 가능성(오즈)&quot;이 약 2배 증가한다.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;부품 고장 예시로 보면:&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;센서 온도가 1도 높아질 때&lt;/li&gt;
&lt;li&gt;고장날 가능성이 2배 증가&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;이렇게 해석할 수 있습니다.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&lt;span&gt;&lt;span&gt;아주 직관적이죠.&lt;/span&gt;&lt;/span&gt;&lt;/b&gt;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h2 data-ke-size=&quot;size26&quot;&gt;&lt;span&gt;&lt;span&gt;5. 제조업 예시로 한 번에 정리해보자&lt;/span&gt;&lt;/span&gt;&lt;/h2&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;부품 온도(X)가 고장 여부(Y=1)에 영향을 준다고 합시다.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;로지스틱 회귀 결과가 이렇게 나왔어요:&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;변수&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 계수 &amp;beta;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;오즈비(e^&amp;beta;)&amp;nbsp; &amp;nbsp;의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;온도&lt;/td&gt;
&lt;td&gt;0.5&lt;/td&gt;
&lt;td&gt;1.65&lt;/td&gt;
&lt;td&gt;온도 1도 증가 &amp;rarr; 고장 가능성 1.65배 증가&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;온도 50도 -&amp;gt; 오즈 = 0.2&lt;/li&gt;
&lt;li&gt;온도 51도 -&amp;gt; 오즈 = 0.33&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;고장 확률이 0.2에서 0.33으로&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;절대값으로 보면 조금 올라간 것 같지만,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;가능성 비율&quot;로 보면&lt;b&gt; 1.65배 증가&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 차이가 정말 중요합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 단순히 &quot;확률이 증가한다&quot;가 아니라 &quot;가능성이 몇 배 증가하는가&quot;를 말하는 모델&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 로지스틱 회귀의 본질입니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;확률은 절대적 크기&lt;/li&gt;
&lt;li&gt;오즈는 상대적 가능성&lt;/li&gt;
&lt;li&gt;오즈비는 변화의 배율&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그리고 모델은 log-odds를 직선 형태로 다루기 때문에&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;해석도 깔끔하고 계산도 간단해집니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;확률(p)&lt;/td&gt;
&lt;td&gt;1이 될 절대적 비율&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;오즈(p/(1-p))&lt;/td&gt;
&lt;td&gt;1:0 가능성의 비율&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;로그오즈&lt;/td&gt;
&lt;td&gt;오즈를 직선화한 값&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;오즈비&lt;/td&gt;
&lt;td&gt;X가 1 증가할 때 오즈가 몇 배 변하는가&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>Ai</category>
      <category>log-odds</category>
      <category>ODDS</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>오즈</category>
      <category>오즈비</category>
      <category>통계</category>
      <category>회귀</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/478</guid>
      <comments>https://allensdatablog.tistory.com/entry/22-%EB%A1%9C%EC%A7%80%EC%8A%A4%ED%8B%B1-%ED%9A%8C%EA%B7%80-%ED%95%B4%EC%84%9D-%EC%98%A4%EC%A6%88-%EB%A1%9C%EA%B7%B8%EC%98%A4%EC%A6%88-%EC%98%A4%EC%A6%88%EB%B9%84%EB%A5%BC-%ED%95%9C-%EB%B2%88%EC%97%90-%EC%9D%B4%ED%95%B4%ED%95%98%EA%B8%B0#entry478comment</comments>
      <pubDate>Fri, 6 Feb 2026 09:40:05 +0900</pubDate>
    </item>
    <item>
      <title>21. 단순선형회귀 vs 로지스틱 회귀 - 예측과 분류의 갈림길</title>
      <link>https://allensdatablog.tistory.com/entry/21-%EB%8B%A8%EC%88%9C%EC%84%A0%ED%98%95%ED%9A%8C%EA%B7%80-vs-%EB%A1%9C%EC%A7%80%EC%8A%A4%ED%8B%B1-%ED%9A%8C%EA%B7%80-%EC%98%88%EC%B8%A1%EA%B3%BC-%EB%B6%84%EB%A5%98%EC%9D%98-%EA%B0%88%EB%A6%BC%EA%B8%B8</link>
      <description>&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 둘의 목적부터 완전히 다르다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;데이터 분석에서 가장 먼저 판단해야 하는 건 &quot;Y가 어떤 종류의 값인가?&quot;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;모델&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;종속변수(Y)의 형태&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 목적&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;단순선형회귀&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;연속형 (숫자)&lt;/td&gt;
&lt;td&gt;값을 예측&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;로지스틱 회귀&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;범주형 (0/1)&lt;/td&gt;
&lt;td&gt;확률&amp;middot;분류&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차 제조업에서 보면:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;단순선형회귀가 필요한 상황&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;차량 무게로 &lt;b&gt;연비를 예측&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;엔진 성능으로 &lt;b&gt;제동거리 예측&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;타이어 공기압으로 &lt;b&gt;마모도 수명 예측&lt;/b&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;로지스틱 회귀가 필요한 상황&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;센서 값으로 이 부품이 &lt;b&gt;고장(1) / 정상(0)&lt;/b&gt;인지&lt;/li&gt;
&lt;li&gt;품질검사 데이터로 제품이 &lt;b&gt;합격(1) / 불합격(0)&lt;/b&gt;인지&lt;/li&gt;
&lt;li&gt;자율주행 상황에서 객체를 &lt;b&gt;탐지(1) / 미탐지(0)&lt;/b&gt;할지&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이렇게 목적부터 완전히 달라서 모델 구조도 달라집니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 단순선형회귀: &quot;직선 하나로 설명하자&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;단순회귀는 아주 단순합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;y&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;^&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;=&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&amp;beta;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;0&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;+&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&amp;beta;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;1&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;x&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;입력 X가 1만큼 늘면 Y가 &amp;beta;₁ 만큼 늘거나 줄죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래프도 &quot;직선&quot;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;제조업 예시&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;차량 무게 -&amp;gt; 연비 모델에서&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;X: 차량 무게(kg)&lt;/li&gt;
&lt;li&gt;Y: 연비(km/L)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀선은 점들의 흐름을 따라 직선 하나를 긋는 방식입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;한계도 명확합니다&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;직선은 세상을 부드럽게 설명하긴 좋지만,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;Y가 0~1 범위를 벗어나면 안 되는 문제&lt;/b&gt;에는 맞지 않습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 &quot;고장 확률&quot;은 절대 120% 또는 -40%가 될 수 없죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 등장한 모델이 로지스틱 회귀입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 로지스틱 회귀 : &quot;확률을 예측하는 모델&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;로지스틱 회귀는 식부터 다릅니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;272&quot; data-origin-height=&quot;58&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/lIdWp/dJMcafydXSV/heAZ232AlNHEJs0CMDgLbK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/lIdWp/dJMcafydXSV/heAZ232AlNHEJs0CMDgLbK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/lIdWp/dJMcafydXSV/heAZ232AlNHEJs0CMDgLbK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FlIdWp%2FdJMcafydXSV%2FheAZ232AlNHEJs0CMDgLbK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;272&quot; height=&quot;58&quot; data-origin-width=&quot;272&quot; data-origin-height=&quot;58&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;여기서 p는 '1일 확률'입니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;0보다 작아지지도 않고&lt;/li&gt;
&lt;li&gt;1보다 커지지도 않습니다&lt;/li&gt;
&lt;li&gt;S자(Sigmoid) 곡선이 됩니다&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;제조업 예시&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;이 부품이 고장 날 확률을 예측하라.&quot;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;X: 센서 온도&lt;/li&gt;
&lt;li&gt;Y: 고장 여부 (1 = 고장, 0 = 정상)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;센서 온도가 올라갈수록&amp;nbsp; S-곡선을 따라 고장 확률이 올라갑니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 왜 굳이 Sigmoid(시그모이드)인가?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;간단하게 말하면,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;확률은 0~1 사이여야 하니까.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;선형 회귀는 직선이라 계속 뻗어나가기 때문에&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;확률을 예측하기엔 구조적으로 맞지 않습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;반면 로지스틱은&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;X가 매우 낮으면 p &amp;asymp; 0&lt;/li&gt;
&lt;li data-end=&quot;1589&quot; data-start=&quot;1570&quot;&gt;X가 매우 높으면 p &amp;asymp; 1&lt;/li&gt;
&lt;li&gt;중간 구간에서 변화가 급격&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 &quot;현실적인 확률 패턴&quot;을 만들어줍니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 계수 해석의 차이&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;단순선형회귀의 계수 &amp;beta;₁ &lt;/b&gt;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;X가 1 증가할 때, Y가 &amp;beta;₁만큼 증가/감소한다. &lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예 : 차량 무게 100kg 증가 -&amp;gt; 연비 0.5km/L 감소&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;로지스틱 회귀의 계수 &amp;beta;₁ &lt;/b&gt;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;X가 1 증가할 때, &lt;b&gt;log-odds(로그 오즈)&lt;/b&gt;가 &amp;beta;₁만큼 증가한다.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;잠깐, log-odds가 뭐냐면:&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;99&quot; data-origin-height=&quot;67&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/b2peQW/dJMcahJzQnE/RuQQjvEYH5Xa0kssnPGGGK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/b2peQW/dJMcahJzQnE/RuQQjvEYH5Xa0kssnPGGGK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/b2peQW/dJMcahJzQnE/RuQQjvEYH5Xa0kssnPGGGK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fb2peQW%2FdJMcahJzQnE%2FRuQQjvEYH5Xa0kssnPGGGK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;99&quot; height=&quot;67&quot; data-origin-width=&quot;99&quot; data-origin-height=&quot;67&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 확률 p 자체가 아니고&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;1일 가능성 대비 0일 가능성의 비율&quot;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 개념이 어렵게 느껴지기 때문에&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;실무에서는 보통 &lt;b&gt;오즈비(Odds ratio)&lt;/b&gt;로 해석합니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;106&quot; data-origin-height=&quot;42&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/cFLCLz/dJMcahv2vQI/5a5YKU0SeFK2QKDggxvsD0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/cFLCLz/dJMcahv2vQI/5a5YKU0SeFK2QKDggxvsD0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/cFLCLz/dJMcahv2vQI/5a5YKU0SeFK2QKDggxvsD0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FcFLCLz%2FdJMcahv2vQI%2F5a5YKU0SeFK2QKDggxvsD0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;106&quot; height=&quot;42&quot; data-origin-width=&quot;106&quot; data-origin-height=&quot;42&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 e⁰&amp;middot;⁷ = 약 2.0이면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;X가 1 증가할 때 &lt;b&gt;고장 가능성이 2배&lt;/b&gt;가 된다는 의미입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 그래프로 보면 차이가 더 명확해진다&lt;/h3&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/coTTOF/dJMcab3E4V1/RyEhJx4iJ1xCW1kyOKNX51/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/coTTOF/dJMcab3E4V1/RyEhJx4iJ1xCW1kyOKNX51/img.png&quot; data-alt=&quot;단순선형회귀-로지스틱회귀&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/coTTOF/dJMcab3E4V1/RyEhJx4iJ1xCW1kyOKNX51/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FcoTTOF%2FdJMcab3E4V1%2FRyEhJx4iJ1xCW1kyOKNX51%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;659&quot; height=&quot;659&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;단순선형회귀-로지스틱회귀&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;단순회귀 그래프&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;점들의 흐름을 직선으로 관통&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 예측값이 -&amp;infin; ~ +&amp;infin; 가능&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; &quot;숫자 예측&quot;에 적합&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;로지스틱 회귀 그래프&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;S자 곡선&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 예측값이 0~1 확률&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; &quot;분류&quot; 또는 &quot;예/아니요&quot; 문제에 적합&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 제조업 예시로 한 번에 정리&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;문제&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; Y형태&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;적합 모델&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 이유&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;연비 예측&lt;/td&gt;
&lt;td&gt;숫자(연속)&lt;/td&gt;
&lt;td&gt;단순회귀&lt;/td&gt;
&lt;td&gt;직선으로 예측 가능&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;제동거리 예측&lt;/td&gt;
&lt;td&gt;숫자(연속)&lt;/td&gt;
&lt;td&gt;단순회귀&lt;/td&gt;
&lt;td&gt;예측값 제한 없음&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;고장 여부(0/1)&lt;/td&gt;
&lt;td&gt;범주형(이진)&lt;/td&gt;
&lt;td&gt;로지스틱&lt;/td&gt;
&lt;td&gt;확률 모델 필요&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;품질 불량(0/1)&lt;/td&gt;
&lt;td&gt;범주형&lt;/td&gt;
&lt;td&gt;로지스틱&lt;/td&gt;
&lt;td&gt;시그모이드 구조&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;구분&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;단순회귀&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;로지스틱 회귀&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;목적&lt;/td&gt;
&lt;td&gt;수치 예측&lt;/td&gt;
&lt;td&gt;분류(확률 예측)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;Y&lt;/td&gt;
&lt;td&gt;연속형&lt;/td&gt;
&lt;td&gt;이진&amp;middot;범주&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;형태&lt;/td&gt;
&lt;td&gt;직선&lt;/td&gt;
&lt;td&gt;S형 곡선&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;예측값 범위&lt;/td&gt;
&lt;td&gt;제한 없음&lt;/td&gt;
&lt;td&gt;0~1 확률&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;해석&lt;/td&gt;
&lt;td&gt;기울기 중심&lt;/td&gt;
&lt;td&gt;오즈비 중심&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;9. 마무리&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;단순회귀는 숫자를 예측하는 모델,&lt;br /&gt;로지스틱은 확률과 분류를 예측하는 모델.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;두 모델은 수식 구조만 다르지&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결국 'X가 Y에 어떤 영향을 주는가'를 설명하는 방식이라는 점에서 같습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>단순회귀</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>로지스틱회귀</category>
      <category>모델</category>
      <category>분류</category>
      <category>예측</category>
      <category>오즈비</category>
      <category>통계</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/477</guid>
      <comments>https://allensdatablog.tistory.com/entry/21-%EB%8B%A8%EC%88%9C%EC%84%A0%ED%98%95%ED%9A%8C%EA%B7%80-vs-%EB%A1%9C%EC%A7%80%EC%8A%A4%ED%8B%B1-%ED%9A%8C%EA%B7%80-%EC%98%88%EC%B8%A1%EA%B3%BC-%EB%B6%84%EB%A5%98%EC%9D%98-%EA%B0%88%EB%A6%BC%EA%B8%B8#entry477comment</comments>
      <pubDate>Tue, 3 Feb 2026 09:25:10 +0900</pubDate>
    </item>
    <item>
      <title>20. 변수 선택과 모델링 전략 - &amp;quot;어떤 변수를 넣고 뺄 것인가?&amp;quot;</title>
      <link>https://allensdatablog.tistory.com/entry/20-%EB%B3%80%EC%88%98-%EC%84%A0%ED%83%9D%EA%B3%BC-%EB%AA%A8%EB%8D%B8%EB%A7%81-%EC%A0%84%EB%9E%B5-%EC%96%B4%EB%96%A4-%EB%B3%80%EC%88%98%EB%A5%BC-%EB%84%A3%EA%B3%A0-%EB%BA%84-%EA%B2%83%EC%9D%B8%EA%B0%80</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bRvpbv/dJMcacVNoxJ/h9PkJbaeAOvrSTvdHgF2P0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bRvpbv/dJMcacVNoxJ/h9PkJbaeAOvrSTvdHgF2P0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bRvpbv/dJMcacVNoxJ/h9PkJbaeAOvrSTvdHgF2P0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbRvpbv%2FdJMcacVNoxJ%2Fh9PkJbaeAOvrSTvdHgF2P0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;522&quot; height=&quot;522&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀를 조금만 해보면 누구나 이런 고민을 합니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;변수가 너무 많은데.. 어떤 걸 써야 하지?&quot;&lt;br /&gt;&quot;빼면 정보가 손실될 것 같고, 넣으면 공선성이 생기고...&quot;&lt;br /&gt;&quot;결국 좋은 모델은 어떻게 만드는 걸까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;실제로 제조업(자동차 포함) 데이터에서는 변수들이 많고 서로 연결되어 있어서&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;무엇을 넣고 빼는가&quot;가 모델의 품질을 거의 결정합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이번 글에서는 그 기준을 &lt;b&gt;간단하고 직관적&lt;/b&gt;으로 정리해 보겠습니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 모든 변수를 넣는 것이 답은 아니다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;데이터를 처음 다룰 때 흔히 하는 실수가 있습니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;많이 넣으면 더 정확한 모델이 되겠지, &quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 현실은 그 반대입니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;데이터는 늘 표본 오차를 가지고 있고&lt;/li&gt;
&lt;li&gt;변수는 서로 연관되어 있으며&lt;/li&gt;
&lt;li&gt;불필요한 변수는 노이즈를 늘려&lt;/li&gt;
&lt;li&gt;&lt;b&gt;해석 불가능한 모델&lt;/b&gt;을 만들어냅니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모델은 단순할수록 좋습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;마치 자동차 부품이 적을수록 고장이 덜 나는 것처럼요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 좋은 모델의 기본 원칙 3가지&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;원칙 1: 변수가 '의미 있는 정보'를 가지고 있어야 한다&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차 연비 모델에서:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;차량 무게 -&amp;gt; 의미 있음&lt;/li&gt;
&lt;li&gt;엔진 배기량 -&amp;gt; 의미 있음&lt;/li&gt;
&lt;li&gt;차량 색상 -&amp;gt; 의미 없음&lt;/li&gt;
&lt;li&gt;제조 공장 이름 -&amp;gt; 의미 없음&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;데이터가 있다고 모두 넣는 것이 아니라&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;Y를 설명할만한 이유&quot;가 있는 변수만 넣어야 합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;원칙 2: 변수들끼리 역할이 겹치면 위험하다&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 바로 앞 글에서 다룬 &lt;b&gt;다중공선성&lt;/b&gt; 문제입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예시 :&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;배기량, 마력, 토크&lt;/li&gt;
&lt;li&gt;차급(class), 전장, 전폭&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 구성은 서로 비슷한 정보를 제공하기 때문에&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모델이 &quot;누가 진짜 영향인지&quot; 판단하지 못합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;겹치는 건 &lt;b&gt;하나만 남기거나, 조합&lt;/b&gt;하는 게 좋습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;원칙 3: 해석 가능한 변수를 선택해야 한다&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모델의 목적이 예측이 아니라 &lt;b&gt;해석(영향 파악)&lt;/b&gt;이라면 특히 중요합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&quot;차량 무게가 연비에 미치는 영향(kg담 몇 km/L인지)&quot;, 이건 해석 가능하죠.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;반면 PCA로 변수를 섞어버리면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예측력은 좋아도 해석이 어려워집니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 실무에서 쓰는 변수 선택 전략&lt;/h3&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;1) 도메인 지식 기반 선택 (가장 중요)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자동차 엔지니어가 보기에&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;연비에 영향을 줄 만한 요인&quot;을 먼저 리스트업 하는 방식입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;차량 무게&lt;/li&gt;
&lt;li&gt;배기량&lt;/li&gt;
&lt;li&gt;공기저항계수&lt;/li&gt;
&lt;li&gt;타이어 마찰&lt;/li&gt;
&lt;li&gt;변속기 종류&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;통계적 절차보다 먼저 &lt;b&gt;현업의 이해&lt;/b&gt;로 걸러내는 것이 가장 정확합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;2) 상관계수(corr)로 기초 점검&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;0.7 이상이면 서로 강하게 연관된 상태로 보고&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;변수들의 &quot;카피&quot;가 있는지 확인합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 상관계수는 한계가 있으므로&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;반드시 다음 기법도 사용해야 합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;3) VIF로 공선성 점검&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;앞에서 말씀드린 대로,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;VIF &amp;gt; 10이면 거의 확실하게 문제입니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;VIF 높음 -&amp;gt; 변수 제거 또는 대체&lt;/li&gt;
&lt;li&gt;VIF 낮음 -&amp;gt; &quot;독립적인 정보&quot;를 준다는 의미&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;4) 모델 비교 (전진/후진/Stepwise)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자동화된 변수 선택 절차입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;전진 선택 (Forward)&lt;/b&gt;&lt;br /&gt;-&amp;gt; 변수를 하나씩 추가하면서 성능이 좋아지는지 확인&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;후진 제거 (Backward)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 일단 모두 넣고, 영향이 작은 것부터 제거&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;Stepwise&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 둘을 섞은 방식&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 이 방식은 &lt;b&gt;기계적으로 결정&lt;/b&gt;되기 때문에&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;반드시 &lt;b&gt;도메인 지식 + 진단 그래프&lt;/b&gt;와 함께 사용해야 합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;5) 규제 회귀(Lasso, Ridge)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;변수가 많거나, 공선성이 심하면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;Lasso, Ridge 같은 규제 기법이 큰 도움이 됩니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;Ridge -&amp;gt; 공선성 완화&lt;/li&gt;
&lt;li&gt;Lasso -&amp;gt; 불필요한 변수를 자동 제거&lt;/li&gt;
&lt;li&gt;Elastic Net -&amp;gt; 두 방법의 장점 결합&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;제조업 데이터처러 변수가 많은 환경에 매우 잘 맞는 방식입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 자동차 예시로 한 번에 이해하기&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;연비(Y)를 예측하려고 합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;처음에는 아래 변수를 모두 넣었어요.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;차량무게&lt;/li&gt;
&lt;li&gt;배기량&lt;/li&gt;
&lt;li&gt;마력&lt;/li&gt;
&lt;li&gt;전폭&lt;/li&gt;
&lt;li&gt;전장&lt;/li&gt;
&lt;li&gt;타이어 폭&lt;/li&gt;
&lt;li&gt;공기저항계수&lt;/li&gt;
&lt;li&gt;변속기 종류&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모델을 돌려보니:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;배기량, 마력, 토크(VIF 12+) -&amp;gt; 공선성&lt;/li&gt;
&lt;li&gt;전폭, 전장(VIF 8~10) -&amp;gt; 차급 정보를 중복 표현&lt;/li&gt;
&lt;li&gt;공기저항계수는 강한 유의성&lt;/li&gt;
&lt;li&gt;타이어 폭은 유의하지 않음&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;최종적으로 아래만 선택합니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;차량무게&lt;/li&gt;
&lt;li&gt;공기저항계수&lt;/li&gt;
&lt;li&gt;변속기 종류&lt;/li&gt;
&lt;li&gt;배기량(마력, 토크 제외)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이렇게 하면:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;해석이 명확해지고&lt;/li&gt;
&lt;li&gt;공선성이 줄어들고&lt;/li&gt;
&lt;li&gt;p값이 안정적으로 나오고&lt;/li&gt;
&lt;li&gt;예측력도 오히려 좋아집니다&lt;/li&gt;
&lt;/ul&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;즉, 변수를 줄이는 것은 &quot;정보 손실&quot;이 아니라&lt;br /&gt;&lt;b&gt;&quot;모델의 품질을 개선하는 과정&quot;&lt;/b&gt;입니다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;전략&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 핵심&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;도메인 기반&lt;/td&gt;
&lt;td&gt;가장 중요, 첫 단계&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;상관계수&lt;/td&gt;
&lt;td&gt;중복 변수 탐색&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;VIF&lt;/td&gt;
&lt;td&gt;공선성 진단 도구&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;자동 선택&lt;/td&gt;
&lt;td&gt;전진&amp;middot;후진&amp;middot;Stepwise&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;규제 회귀&lt;/td&gt;
&lt;td&gt;변수 많을 때 강력&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;목표에 따라 선택&lt;/td&gt;
&lt;td&gt;해석 vs 예측용 모델 구분&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;좋은 모델은 변수 100개를 넣는 게 아니라&lt;br /&gt;&lt;/span&gt;필요한 변수 몇 개를 정확히 고르는 것입니다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>VIIF</category>
      <category>규제회귀</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>모델</category>
      <category>변수</category>
      <category>상관계수</category>
      <category>전진</category>
      <category>통계</category>
      <category>후진</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/476</guid>
      <comments>https://allensdatablog.tistory.com/entry/20-%EB%B3%80%EC%88%98-%EC%84%A0%ED%83%9D%EA%B3%BC-%EB%AA%A8%EB%8D%B8%EB%A7%81-%EC%A0%84%EB%9E%B5-%EC%96%B4%EB%96%A4-%EB%B3%80%EC%88%98%EB%A5%BC-%EB%84%A3%EA%B3%A0-%EB%BA%84-%EA%B2%83%EC%9D%B8%EA%B0%80#entry476comment</comments>
      <pubDate>Sat, 31 Jan 2026 10:35:28 +0900</pubDate>
    </item>
    <item>
      <title>19. 다중공선성 - 왜 변수들이 서로 닮아 있으면 문제가 될까?</title>
      <link>https://allensdatablog.tistory.com/entry/19-%EB%8B%A4%EC%A4%91%EA%B3%B5%EC%84%A0%EC%84%B1-%EC%99%9C-%EB%B3%80%EC%88%98%EB%93%A4%EC%9D%B4-%EC%84%9C%EB%A1%9C-%EB%8B%AE%EC%95%84-%EC%9E%88%EC%9C%BC%EB%A9%B4-%EB%AC%B8%EC%A0%9C%EA%B0%80-%EB%90%A0%EA%B9%8C</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/cHBcmu/dJMcahCNbCJ/MrNh2BdFKC0WhYort67mOk/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/cHBcmu/dJMcahCNbCJ/MrNh2BdFKC0WhYort67mOk/img.png&quot; data-alt=&quot;다중공선성&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/cHBcmu/dJMcahCNbCJ/MrNh2BdFKC0WhYort67mOk/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FcHBcmu%2FdJMcahCNbCJ%2FMrNh2BdFKC0WhYort67mOk%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;591&quot; height=&quot;591&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;다중공선성&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀분석은 기본적으로&lt;b&gt; &quot;한 변수의 순수한 효과&quot;&lt;/b&gt;를 보고 싶어 하는 방법입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그런데 현실의 데이터에서는 변수가 서로 아주 비슷하게 움직이는 경우가 많아요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자동차 제조업 데이터를 예로 들어보겠습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;엔진 배기량(cc)&lt;/li&gt;
&lt;li&gt;마력(hp)&lt;/li&gt;
&lt;li&gt;토크(Nm)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 3개는 서로 굉장히 밀접하게 묶여 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;배기량이 큰 차는 마력도 높고, 토크도 높은 경향이 있죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이렇게 &lt;b&gt;서로 강하게 상관된 변수들&lt;/b&gt;이 동시에 회귀모델에 들어가 있으면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;문제가 발생합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이걸 &lt;b&gt;다중공선성(Muticollinearity)&lt;/b&gt;이라고 부릅니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 다중공선성이 있으면 어떤 문제가 생길까?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이건 정말 자주 질문받는 부분인데,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;문제를 단순하게 정리하면 다음 세 가지입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;문제 1: 회귀계수(&amp;beta;)가 불안정해진다&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;공선성이 심하면 &amp;beta;값이 &lt;b&gt;크게 흔들립니다.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;어제는 마력이 연비에 큰 영향을 주는 것처럼 보였는데&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;오늘 데이터로 돌려보면 배기량이 더 중요한 것처럼 보이고...&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;해석이 흔들리기 때문에 믿을 수 없는 모델이 된다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;문제 2: 계수의 부호가 이상해질 수 있다&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;실제로 가장 당황스러운 경우는 이것입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;직관적으로는&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;배기량 &amp;uarr; &amp;rarr; 연비 &amp;darr; (음의 관계)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;라고 알고 있는데,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀 결과가 이렇게 나올 수도 있어요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;Y^ = 25 + 03.배기량 - 0.9마력&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;배기량이 커지는데 연비가 오른다?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;말이 안 되죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 이유는 배기량과 마력이 &lt;b&gt;너무 비슷하게 움직이기 때문&lt;/b&gt;에,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모델이 &quot;둘의 순수한 역할을 분리해 낼 수 없기 때문&quot;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;문제 3: p값이 커지고 유의성이 낮아진다&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀계수의 표준오차가 커집니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;진짜 효과는 있는데, 통계적으로 유의하지 않은 것처럼 보이는 현상&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 나타내요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style5&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 왜 이런 문제가 생기는 걸까?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;직관적으로 말하면,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;X₁과 X₂가 거의 같은 정보라면,&lt;br /&gt;모델이 '누가 진짜 영향력을 가직 변수인지' 구분하지 못한다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차에서&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;배기량(cc)&lt;/li&gt;
&lt;li&gt;실린더 수&lt;/li&gt;
&lt;li&gt;엔진 무게&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 세 변수가 거의 동일한 패턴으로 움직인다면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀모델 입장에서는 &quot;누가 무엇을 설명하는지&quot; 헷갈리기 시작합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 다중공선성은 어떻게 진단할까?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;1) 상관계수(correlation) 확인&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가장 간단한 방법입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 0.8 이상이면 공선성을 의심합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 이것만으로 충분하지는 않아요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 존재하는 더 중요한 지표가 있습니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;2) VIF(Variance Inflattion Factor)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;공선성 진단의 표준 도구입니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;133&quot; data-origin-height=&quot;56&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/c1ZA6C/dJMcafdUc1N/y959Pc1iqX9MkBAnKbPZYK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/c1ZA6C/dJMcafdUc1N/y959Pc1iqX9MkBAnKbPZYK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/c1ZA6C/dJMcafdUc1N/y959Pc1iqX9MkBAnKbPZYK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fc1ZA6C%2FdJMcafdUc1N%2Fy959Pc1iqX9MkBAnKbPZYK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;133&quot; height=&quot;56&quot; data-origin-width=&quot;133&quot; data-origin-height=&quot;56&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;보통 기준은 다음과 같습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;VIF&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 해석&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;1 ~ 5&lt;/td&gt;
&lt;td&gt;대부분 문제 없음&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;5 ~ 10&lt;/td&gt;
&lt;td&gt;공선성 의심&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;10 이상&lt;/td&gt;
&lt;td&gt;심각한 공선성&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차 데이터에서&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;배기량의 VIF가 12가 나왔다면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 변수는 다른 변수와 매우 비슷한 정보를 가진다는 뜻입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 해결 방법 - 실무에서 정말 자주 쓰는 방법들&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;방법 1: 강하게 연관된 변수 중 하나만 선택하기&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 배기량, 마력, 토크가 모두 높은 상관을 가진다면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;한두 개만 선택하는 방법입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;장점:&lt;/b&gt; 해석이 명확해지고 모델이 단순해짐&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;단점:&lt;/b&gt; 약간의 정보 손실&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;방법 2: 변수들을 묶어서 '지표(지수)'로 만들기&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;엔진 성능 관련 변수를 하나로 합쳐&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;엔진 퍼포먼스 점수(Score)&quot;처럼 만들 수 있죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;방법 3: 표준화(Scaling)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표준화는 공선성을 해결하진 못하지만&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;계수의 해석을 안정시키는 데 도움을 줍니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;방법 4: PCA 같은 차원축소&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;변수들을 서로 독립적인 축으로 만드는 방법이죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;방법 5: 규제 회귀(Regularization)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;Lasso, Ridge, Elastic Net 같은 기법을 쓰면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;공선성이 있어도 계수가 불안정해지는 문제를 줄일 수 있습니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 자동차 예시로 이해해 보자&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;차량 연비(Y)를 설명하기 위해 아래 변수를 넣었다고 합시다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;차량 무게&lt;/li&gt;
&lt;li&gt;배기량&lt;/li&gt;
&lt;li&gt;마력&lt;/li&gt;
&lt;li&gt;토크&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결과가 이렇게 나왔다고 해봅시다:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;변수&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 계수&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;p값&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; VIF&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;무게&lt;/td&gt;
&lt;td&gt;-0.006&lt;/td&gt;
&lt;td&gt;0.001&lt;/td&gt;
&lt;td&gt;2.2&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;배기량&lt;/td&gt;
&lt;td&gt;-0.003&lt;/td&gt;
&lt;td&gt;0.40&lt;/td&gt;
&lt;td&gt;12.5&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;마력&lt;/td&gt;
&lt;td&gt;+0.002&lt;/td&gt;
&lt;td&gt;0.60&lt;/td&gt;
&lt;td&gt;11.8&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;토크&lt;/td&gt;
&lt;td&gt;-0.001&lt;/td&gt;
&lt;td&gt;0.52&lt;/td&gt;
&lt;td&gt;10.7&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;배기량, 마력, 토크는 CIF가 전부 10 이상&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 서로 너무 비슷한 정보&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;계수가 불안정&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;p값도 높아서 유의하지 않음&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;해결:&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;배기량 하나만 남기고 나머지는 제거&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;또는&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;엔진 성능 점수(Performance Index)로 묶기&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;또는&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;Ridge 회귀 적용하기&lt;/li&gt;
&lt;/ul&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;다중공선성&lt;/td&gt;
&lt;td&gt;독립변수끼리 서로 강하게 상관된 상태&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;문제점&lt;/td&gt;
&lt;td&gt;계수 불안정, 해석 불가능, p값 상승&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;진단&lt;/td&gt;
&lt;td&gt;상관계수, VIF (10 이상이면 위험)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;해결&lt;/td&gt;
&lt;td&gt;변수 선택, 변수 조합, PCA, 규제 회귀&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;공선성은 회귀모델을 헷갈리게 하고, &lt;/span&gt;해석을 흐릿하게 만든다.&lt;br /&gt;좋은 모델은 '중복된 이야기'를 줄여 스스로 명확해진다.&quot;&lt;/blockquote&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>CIF</category>
      <category>PCA</category>
      <category>다중공선성</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>독립변수</category>
      <category>변수</category>
      <category>상관계수</category>
      <category>통계</category>
      <category>회귀계수</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/475</guid>
      <comments>https://allensdatablog.tistory.com/entry/19-%EB%8B%A4%EC%A4%91%EA%B3%B5%EC%84%A0%EC%84%B1-%EC%99%9C-%EB%B3%80%EC%88%98%EB%93%A4%EC%9D%B4-%EC%84%9C%EB%A1%9C-%EB%8B%AE%EC%95%84-%EC%9E%88%EC%9C%BC%EB%A9%B4-%EB%AC%B8%EC%A0%9C%EA%B0%80-%EB%90%A0%EA%B9%8C#entry475comment</comments>
      <pubDate>Wed, 28 Jan 2026 10:12:36 +0900</pubDate>
    </item>
    <item>
      <title>18. 최소제곱법의 직관 - 왜 '제곱'을 최소화할까?</title>
      <link>https://allensdatablog.tistory.com/entry/18-%EC%B5%9C%EC%86%8C%EC%A0%9C%EA%B3%B1%EB%B2%95%EC%9D%98-%EC%A7%81%EA%B4%80-%EC%99%9C-%EC%A0%9C%EA%B3%B1%EC%9D%84-%EC%B5%9C%EC%86%8C%ED%99%94%ED%95%A0%EA%B9%8C</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1536&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bajTjP/dJMcaajlYDp/hZLNwCANn0QM8h4wrnlKdK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bajTjP/dJMcaajlYDp/hZLNwCANn0QM8h4wrnlKdK/img.png&quot; data-alt=&quot;최소제곱법&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bajTjP/dJMcaajlYDp/hZLNwCANn0QM8h4wrnlKdK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbajTjP%2FdJMcaajlYDp%2FhZLNwCANn0QM8h4wrnlKdK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;560&quot; height=&quot;840&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1536&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;최소제곱법&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀분석에서 가장 근본이 되는 원리가 &lt;b&gt;'최소제곱법(OLS, Ordinary Least Squares)'입니다.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;우리는 이미 회귀선을 그릴 때 이런 말을 합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;실제 데이터와 예측선 사이의 오차가 최소가 되도록 선을 찾는다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그런데 여기서 자연스럽게 떠오르는 한 가지 질문이 있죠.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;오차를 그냥 더하면 되지, 왜 굳이 제곱을 해서 더하는 걸까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;오늘은 그 이유를 아주 직관적으로,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그리고 제조업(특히 자동차 예시)을 활용해서 이해해 보겠습니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 예측선과 실제 데이터의 '거리'가 오차입니다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀선을 이렇게 생겼습니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;121&quot; data-origin-height=&quot;41&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/tCRmV/dJMb99ShwXJ/lVKEPr3uLkOqkAXzKgwiFK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/tCRmV/dJMb99ShwXJ/lVKEPr3uLkOqkAXzKgwiFK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/tCRmV/dJMb99ShwXJ/lVKEPr3uLkOqkAXzKgwiFK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FtCRmV%2FdJMb99ShwXJ%2FlVKEPr3uLkOqkAXzKgwiFK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;121&quot; height=&quot;41&quot; data-origin-width=&quot;121&quot; data-origin-height=&quot;41&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그리고 각 점마다 실제값 &lt;span&gt;&lt;span aria-hidden=&quot;true&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;y&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;i&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;와 예측값 y^i 사이의 차이가 만들어지죠.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;112&quot; data-origin-height=&quot;34&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/cCBhZv/dJMcabigeHD/aCfQPqI26BIqXPy9N8AF6k/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/cCBhZv/dJMcabigeHD/aCfQPqI26BIqXPy9N8AF6k/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/cCBhZv/dJMcabigeHD/aCfQPqI26BIqXPy9N8AF6k/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FcCBhZv%2FdJMcabigeHD%2FaCfQPqI26BIqXPy9N8AF6k%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;112&quot; height=&quot;34&quot; data-origin-width=&quot;112&quot; data-origin-height=&quot;34&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 &lt;b&gt;잔차(residual)&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 잔차를 가장 작게 만드는 선이 &quot;가장 잘 맞는 회귀선&quot;이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 문제는...&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;잔차의 '부호(+,-)' 때문에 단순히 더하면 0이 될 수 있다는 것.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차 연비 데이터를 보죠.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;어떤 점은 회귀선보다 위에 있음 -&amp;gt; 잔차 +&lt;/li&gt;
&lt;li&gt;어떤 점은 아래에 있음 -&amp;gt; 잔차 -&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이걸 그냥 더하면, 좋은 선이든 나쁜 선이든&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;서로 상쇄 되어 합이 0&lt;/b&gt; 근처가 되어버릴 수 있어요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 오차를 제대로 측정 할 수 없음.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 첫 번째 문제 해결을 위해 제곱이 등장합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 오차를 제곱하면 부호 문제가 해결됩니다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;잔차를 제곱하면 이렇게 됩니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;120&quot; data-origin-height=&quot;49&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/wSC47/dJMcafrqm5D/RkpxKxax9NUUJX72GZTnyk/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/wSC47/dJMcafrqm5D/RkpxKxax9NUUJX72GZTnyk/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/wSC47/dJMcafrqm5D/RkpxKxax9NUUJX72GZTnyk/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FwSC47%2FdJMcafrqm5D%2FRkpxKxax9NUUJX72GZTnyk%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;120&quot; height=&quot;49&quot; data-origin-width=&quot;120&quot; data-origin-height=&quot;49&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;모든 오차가 &lt;b&gt;양수&lt;/b&gt;가 되고&lt;/li&gt;
&lt;li&gt;큰 오차는 더 크게 반영됩니다&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;잔차&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;제곱 후&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;+3&lt;/td&gt;
&lt;td&gt;9&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;-3&lt;/td&gt;
&lt;td&gt;9&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;+10&lt;/td&gt;
&lt;td&gt;100&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;어떤 방향으로 틀렸든(위든 아래든)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;틀린 정도가 공평하게 반영&lt;/b&gt;되죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이걸 전체 데이터에 대해 더한 것이 바로:&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;122&quot; data-origin-height=&quot;65&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/dRQYoq/dJMcachasKe/NeSmcF5NkWZakZD7jXZgL0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/dRQYoq/dJMcachasKe/NeSmcF5NkWZakZD7jXZgL0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/dRQYoq/dJMcachasKe/NeSmcF5NkWZakZD7jXZgL0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FdRQYoq%2FdJMcachasKe%2FNeSmcF5NkWZakZD7jXZgL0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;122&quot; height=&quot;65&quot; data-origin-width=&quot;122&quot; data-origin-height=&quot;65&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;OLS는 이 값을 가장 작게 만드는 &lt;b&gt;&amp;beta;₀, &amp;beta;₁&lt;/b&gt;을 찾는 방법입니다&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. &quot;그럼 제곱 말고 절댓값을 쓰면 되지 않나요?&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;정확한 질문입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;실제로 &lt;b&gt;L1 회귀(Least Absolute Deviation)&lt;/b&gt;라는 방법은 오차의 절댓값을 최소화합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 회귀분석의 기본으로 제곱을 사용하는 데에는 세 가지 이유가 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h4 data-ke-size=&quot;size20&quot;&gt;이유 1: 제곱은 수학적으로 미분이 쉽다&lt;/h4&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀계수를 구하려면 미분을 해야 하는데,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;제곱 함수는 매끄러운 곡선&lt;/b&gt;이기 때문에 미분이 간단합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;반면 절댓값 함수는 0에서 '뾰족한 형태'라 미분 불가능한 지점이 있어요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 계산 난이도가 크게 차이 납니다&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 컴퓨터가 없던 시절부터 OLS가 표준이었던 이유&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h4 data-ke-size=&quot;size20&quot;&gt;이유 2: 큰 오차에 가중치를 더 준다&lt;/h4&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;제조업, 엔지니어링에서는&lt;b&gt; 큰 오차가 매우 중요한 신호&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차의 제동거리 예측 모델에서:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;대부분 차량은 &amp;plusmn;1m 내에서 예측&lt;/li&gt;
&lt;li&gt;어떤 차량은 10m 이상 차이&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;절댓값이면 10이지만, 제곱값이면 100이 됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 말은 곧 큰 오차가 모델 선태에 크게 반영된다는 뜻이죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 안전, 품질, 공정 문제를 빠르게 감지할 수 있음&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h4 data-ke-size=&quot;size20&quot;&gt;이유 3: 이론적으로 '가장 좋은 성질'을 가진다&lt;/h4&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;정규분포를 따르는 오차가 있다고 가정하면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;OLS는 &lt;b&gt;최우추정법(MLE)과&lt;/b&gt; 동일해집니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;오차가 정규분포라고 가정하면, 제곱을 최소화하는 것이&lt;br /&gt;통계적으로 가장 좋은(최소분산) 추정치를 만든다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이건 이론적으로 매우 탄탄한 근거예요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 자동차 예시로 직관을 잡아보자&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;차량 무게(X) -&amp;gt; 연비(Y) 관계를 모델링한다고 해봅시다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;아래 3가지 후보 회귀선을 생각해 보죠.&lt;/p&gt;
&lt;h4 data-ke-size=&quot;size20&quot;&gt;1. 대부분 점과 적당히 맞는 선&lt;/h4&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 작은 오차들이 골고루 분포&lt;/p&gt;
&lt;h4 data-ke-size=&quot;size20&quot;&gt;2. 몇 개의 점은 잘 맞지만, 나머지는 크게 틀림&lt;/h4&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 큰 오차가 있음&lt;/p&gt;
&lt;h4 data-ke-size=&quot;size20&quot;&gt;3. 전체적으로 오차가 크고 산만함&lt;/h4&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;제곱 오차의 합(SSR)을 계산하면:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;A : 120&lt;/li&gt;
&lt;li&gt;B : 350&lt;/li&gt;
&lt;li&gt;C : 900&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;A가 가장 작은 값 -&amp;gt; A가 최소제곱법이 고른 회귀선&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, &lt;b&gt;전체적으로 가장 균형 잡힌 모델&lt;/b&gt;을 선택해 주는 방법입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;제곱을 쓰는 이유&lt;/td&gt;
&lt;td&gt;부호 문제 해결, 큰 오차 강조, 계산 용이&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;절댓값 대신 제곱?&lt;/td&gt;
&lt;td&gt;미분 가능, 이론적 우수성&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;목적&lt;/td&gt;
&lt;td&gt;전체 오차(잔차)를 가장 작게 만드는 &amp;lsquo;최선의 선&amp;rsquo;을 찾기&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;결과&lt;/td&gt;
&lt;td&gt;회귀계수 &amp;beta;₀, &amp;beta;₁이 계산됨&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;&quot;최소제곱법은 오차를 정직하게 반영해서&lt;br /&gt;&lt;/span&gt;가장 현실적인 회귀선을 뽑아내는 방법이다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>OLS</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>오차</category>
      <category>잔차</category>
      <category>절댓값</category>
      <category>최소제곱법</category>
      <category>통계</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/474</guid>
      <comments>https://allensdatablog.tistory.com/entry/18-%EC%B5%9C%EC%86%8C%EC%A0%9C%EA%B3%B1%EB%B2%95%EC%9D%98-%EC%A7%81%EA%B4%80-%EC%99%9C-%EC%A0%9C%EA%B3%B1%EC%9D%84-%EC%B5%9C%EC%86%8C%ED%99%94%ED%95%A0%EA%B9%8C#entry474comment</comments>
      <pubDate>Mon, 26 Jan 2026 16:47:20 +0900</pubDate>
    </item>
    <item>
      <title>17. 상관관계 vs 인과관계 - 함께 움직인다고 원인은 아니다</title>
      <link>https://allensdatablog.tistory.com/entry/17-%EC%83%81%EA%B4%80%EA%B4%80%EA%B3%84-vs-%EC%9D%B8%EA%B3%BC%EA%B4%80%EA%B3%84-%ED%95%A8%EA%BB%98-%EC%9B%80%EC%A7%81%EC%9D%B8%EB%8B%A4%EA%B3%A0-%EC%9B%90%EC%9D%B8%EC%9D%80-%EC%95%84%EB%8B%88%EB%8B%A4</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/cADzHY/dJMcaf51AFc/8BxYY0gPQJ2LDfkn6IFNbk/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/cADzHY/dJMcaf51AFc/8BxYY0gPQJ2LDfkn6IFNbk/img.png&quot; data-alt=&quot;상관관계-인과관계&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/cADzHY/dJMcaf51AFc/8BxYY0gPQJ2LDfkn6IFNbk/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FcADzHY%2FdJMcaf51AFc%2F8BxYY0gPQJ2LDfkn6IFNbk%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;525&quot; height=&quot;525&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;상관관계-인과관계&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 둘이 비슷해 보여도 완전히 다른 개념&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;먼저 가장 짧고 명확한 정의부터 해볼게요.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;상관관계 : 두 변수가 함께 움직이는 패턴이 있다&lt;/li&gt;
&lt;li&gt;인과관계 : 한 변수가 다른 변수를 변화시킨다&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예시를 들어볼게요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;자동차 회사 예시 1&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;차량 가격 상승&lt;/li&gt;
&lt;li&gt;옵션 개수 상승&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;두 변수는 분명 &lt;b&gt;상관관계&lt;/b&gt;가 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 &quot;가격이 올라서 옵션이 늘었다&quot;라고 단정하긴 어렵습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;오히려 &lt;b&gt;옵션이 많아서 가격이 올라간 것&lt;/b&gt;이 정확하겠죠?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, &lt;b&gt;같이 움직인다고 해서 원인, 결과라고 단정할 수는 없습니다.&lt;/b&gt;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 상관관계는 방향을 알려주지 않는다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;상관계수 r은 아래와 같이 생겼습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt; &lt;span&gt;&lt;span&gt;&amp;minus;&lt;/span&gt;&lt;span&gt;1 &lt;/span&gt;&lt;span&gt;&amp;le; &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;r &lt;/span&gt;&lt;span&gt;&amp;le; &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;1&lt;/span&gt;&lt;/span&gt; &lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;r &amp;gt; 0 -&amp;gt; 함께 증가하거나 감소 (양의 상관)&lt;/li&gt;
&lt;li&gt;r &amp;lt; 0 -&amp;gt; 한쪽은 증가, 한쪽은 감소 (음의 상관)&lt;/li&gt;
&lt;li&gt;r &amp;asymp; 0 -&amp;gt; 패턴 없음&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 우리가 절대 알 수 없는 게 있습니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;무엇이 무엇에 영향을 주는가?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차 시장 데이터를 보면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;801&quot; data-start=&quot;793&quot;&gt;마력 &amp;uarr;&lt;/li&gt;
&lt;li data-end=&quot;810&quot; data-start=&quot;802&quot;&gt;연비 &amp;darr;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 음의 상관관계가 보이지만, 이게&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;마력이 높아서 연비가 낮다&quot;인지,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;연비 좋은 차는 마력을 낮게 설계하는 경향 때문인지&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;데이터만으로는 판단할 수 없습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;상관관계는 &lt;b&gt;함께 움직임만 보여줄 뿐,&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;방향(원인 -&amp;gt;결과)을 알려주진 않아요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 상관관계는 '숨은 변수'에 쉽게 속는다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 사람들이 가장 많이 놓치는 포인트입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;자동차 예시 2&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;데이터를 보니:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1062&quot; data-start=&quot;1047&quot;&gt;차량 크기(전장) &amp;uarr;&lt;/li&gt;
&lt;li data-end=&quot;1076&quot; data-start=&quot;1063&quot;&gt;CO₂ 배출량 &amp;uarr;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 &quot;차가 커서 &lt;span style=&quot;color: #333333; text-align: start;&quot;&gt;CO₂&lt;span&gt; 가 늘어난다!&quot;라고 말하고 싶겠지만&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;color: #333333; text-align: start;&quot;&gt;&lt;span&gt;아래와 같은 것이 숨어 있을 수도 있습니다.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;차가 크면 엔진도 큼&lt;/li&gt;
&lt;li&gt;엔진이 크면 연료 소모량이 많음&lt;/li&gt;
&lt;li&gt;그래서 CO₂ 배출량 증가&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;color: #333333; text-align: start;&quot;&gt;&lt;span&gt;&lt;span style=&quot;color: #333333; text-align: start;&quot;&gt;&lt;span&gt;즉, 엔진 크기라는 또 다른 변수가 둘 사이의 관계를 만들어낸 것.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;color: #333333; text-align: start;&quot;&gt;&lt;span&gt;&lt;span style=&quot;color: #333333; text-align: start;&quot;&gt;&lt;span&gt;이걸 &lt;b&gt;교란변수(confounder)&lt;/b&gt;라고 부릅니다.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;상관관계는 교란변수 하나에 의해 완전히 왜곡될 수 있다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 인과관계를 말하려면 &quot;조건부 비교&quot;가 필요하다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;인과관계를 말하기 위해서는&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;나머지 조건이 같을 때&quot; 한 변수의 효과를 보는 과정이 필요합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이걸 가능하게 하는 게:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;통계에서는 &lt;b&gt;회귀분석&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;실험에서는 &lt;b&gt;통제된 실험(Controlled Experiment)&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;비실험적 데이터에서는 &lt;b&gt;매칭, 성향점수, 도구변수&lt;/b&gt; 같은 기법들&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차의 연비에 영향을 준다고 주장하려면:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;차량 무게가 100kg 늘어났을 때,&lt;br /&gt;엔진 크기, 타이어 종류, 변속기 등 다른 조건이 같다면&lt;br /&gt;연비가 얼마나 변하는가?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 식의 &quot;조건부 비교(conditional comparison)&quot;가 필요합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 실무에서 상관관계를 인과처럼 착각하는 흔한 예&lt;/h3&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;1. 광고비&amp;uarr; &amp;rarr; 매출 &amp;uarr;&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;많이들 이렇게 결론을 내리지만,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;광고비가 높아진 시기는 원래 매출도 상승하는 시즌이었을 수도&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, &lt;b&gt;계절성&lt;/b&gt;이 교란변수일 수 있음.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;2. 공장 조도(밝기) &amp;uarr; &amp;rarr; 작업품질 &amp;uarr;&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;밝기가 원인일까?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;아니면 조도 개선 시기에 &quot;설비 정비&quot;가 함께 이뤄졌을까?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;조건 통제가 없다면 판단 불가능.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;3. 온도 &amp;uarr; &amp;rarr; 제품 불량 &amp;uarr; &lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;온도 자체가 문제일 수도 있지만,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;온도가 높을 때 함께 발생하는 &quot;장비 과부하&quot;가 문제일 수도 있습니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 자동차 예시로 한 번에 정리해 보자&lt;/h3&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;예시: &quot;타이어 공기압이 높으면 연비가 좋아진다?&quot;&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;단순 상관만 보면 이렇게 나올 수 있습니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;공기압 높음 &amp;lt;-&amp;gt; 연비 좋음 -&amp;gt; 상관관계있음&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 왜일까?&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;공기압이 높은 운전자들은&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;관리 습관이 전반적으로 좋을 가능성이 높다&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; -&amp;gt; 엔진오일, 타이어 마모도, 급가속 습관 등도 더 좋을 수 있음&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;연비 상승의 진짜 원인은 운전 습관일 수도 있다.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 우리는 &quot;상관&quot;만 가지고 인과를 말할 수 없다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 그럼 인과관계는 어떻게 증명할까?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;크게 세 가지 방법이 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;1. 무작위 실험(Randomized Controlled Trial)&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;모든 변수 통제&lt;/li&gt;
&lt;li&gt;유일하게 조작한 변수만 차이&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; -&amp;gt; &lt;b&gt;가장 확실한 방법&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 제조업/현업에서는 거의 불가능합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;2. 통계적 통제 (회귀분석)&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;다른 영향을 줄 변수들을 함께 넣습니다.&lt;/li&gt;
&lt;li&gt;특정 변수의 '순수한 영향력'을 추정합니다&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; -&amp;gt; 실무에서 가장 널기 사용&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;3. 준실험적 기법(Quasi-Experiments)&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;성향점수 매칭(PSM)&lt;/li&gt;
&lt;li&gt;차이의 차이(DID)&lt;/li&gt;
&lt;li&gt;도구변수(IV)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp;-&amp;gt;관측데이터에서 인과관계를 추론하는 방법&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 중요한 점&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;상관관계&lt;/td&gt;
&lt;td&gt;두 변수의 함께 움직임&lt;/td&gt;
&lt;td&gt;원인&amp;middot;결과를 말하지 못함&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;인과관계&lt;/td&gt;
&lt;td&gt;한 변수가 다른 변수를 변화시킴&lt;/td&gt;
&lt;td&gt;&amp;ldquo;조건 동일&amp;rdquo;이 핵심&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;교란변수&lt;/td&gt;
&lt;td&gt;둘 사이의 관계를 왜곡하는 제3의 변수&lt;/td&gt;
&lt;td&gt;통제하지 않으면 인과 해석 불가&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;회귀분석&lt;/td&gt;
&lt;td&gt;변수의 순수한 영향력 추정&lt;/td&gt;
&lt;td&gt;비인과적 관계 필터링&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;인과추론&lt;/td&gt;
&lt;td&gt;실험 또는 준실험이 핵심&lt;/td&gt;
&lt;td&gt;데이터만 보면 잘못된 결론 나올 수 있음&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>교란변수</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>데이터해석</category>
      <category>상관관계</category>
      <category>인과관계</category>
      <category>인과추론</category>
      <category>통계</category>
      <category>회귀분석</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/473</guid>
      <comments>https://allensdatablog.tistory.com/entry/17-%EC%83%81%EA%B4%80%EA%B4%80%EA%B3%84-vs-%EC%9D%B8%EA%B3%BC%EA%B4%80%EA%B3%84-%ED%95%A8%EA%BB%98-%EC%9B%80%EC%A7%81%EC%9D%B8%EB%8B%A4%EA%B3%A0-%EC%9B%90%EC%9D%B8%EC%9D%80-%EC%95%84%EB%8B%88%EB%8B%A4#entry473comment</comments>
      <pubDate>Fri, 23 Jan 2026 10:30:22 +0900</pubDate>
    </item>
    <item>
      <title>16. 결정계수(R&amp;sup2;)와 잔차 - &amp;quot;모델이 얼마나 잘 맞았을까?&amp;quot;</title>
      <link>https://allensdatablog.tistory.com/entry/16-%EA%B2%B0%EC%A0%95%EA%B3%84%EC%88%98R%C2%B2%EC%99%80-%EC%9E%94%EC%B0%A8-%EB%AA%A8%EB%8D%B8%EC%9D%B4-%EC%96%BC%EB%A7%88%EB%82%98-%EC%9E%98-%EB%A7%9E%EC%95%98%EC%9D%84%EA%B9%8C</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bVAXgS/dJMcaaRaOzs/VxmeLwS6MXw4pNeVKgnyE0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bVAXgS/dJMcaaRaOzs/VxmeLwS6MXw4pNeVKgnyE0/img.png&quot; data-alt=&quot;결정계수와 잔차&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bVAXgS/dJMcaaRaOzs/VxmeLwS6MXw4pNeVKgnyE0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbVAXgS%2FdJMcaaRaOzs%2FVxmeLwS6MXw4pNeVKgnyE0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;555&quot; height=&quot;555&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;결정계수와 잔차&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;&amp;nbsp;&lt;/h3&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 예측은 했는데... 얼마나 믿을 수 있을까?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자동차 회사에서 이런 모델을 만들었다고 해봅시다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;Y&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;^ &lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;= &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;25.4 &lt;/span&gt;&lt;span&gt;&amp;minus; &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;0.006&lt;/span&gt;&lt;span&gt;X&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;여기서&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;Y: 연비 (km/L)&lt;/li&gt;
&lt;li&gt;X: 차량 무게 (kg)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모델은 &quot;차가 무거울수록 연비가 떨어진다&quot;라고 말합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그런데 실제 데이터에 찍힌 점들은 회귀선 근처에 흩어져 있겠죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그럼 이제 물어볼 차례예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;이 선이 실제 데이터를 얼마나 잘 설명하고 있을까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 답이 바로 &lt;b&gt;결정계수(R&amp;sup2;)&lt;/b&gt; 입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. R&amp;sup2;의 의미 - 설명력의 비율&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결정계수는 이렇게 정의됩니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;227&quot; data-origin-height=&quot;66&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/HqiYM/dJMcahpecXv/ms3ZPIOAlIjjdYyGsCdZ1k/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/HqiYM/dJMcahpecXv/ms3ZPIOAlIjjdYyGsCdZ1k/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/HqiYM/dJMcahpecXv/ms3ZPIOAlIjjdYyGsCdZ1k/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FHqiYM%2FdJMcahpecXv%2Fms3ZPIOAlIjjdYyGsCdZ1k%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;227&quot; height=&quot;66&quot; data-origin-width=&quot;227&quot; data-origin-height=&quot;66&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;조금 말로 풀면 이렇습니다&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;데이터의 전체 변동 중에서, 회귀모형이 설명한 비율.&quot;&lt;br /&gt;&lt;br /&gt;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;구분&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;SST (Total Sum of Squares)&lt;/td&gt;
&lt;td&gt;전체 데이터의 변동량&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;SSR (Sum of Squared Residuals)&lt;/td&gt;
&lt;td&gt;모델이 설명하지 못한 오차&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;R&amp;sup2;&lt;/td&gt;
&lt;td&gt;모델이 설명한 비율 = (1 - SSR/SST)&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 예를 들어볼게요&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;SST = 100 (데이터 전체의 변동)&lt;/li&gt;
&lt;li&gt;SSR = 20 (모델이 못 맞춘 부분)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그럼 &lt;b&gt;R&amp;sup2; = 0.8이면 꽤 잘 맞는 모델&lt;/b&gt;이고,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;R&amp;sup2; = 0.3이라면 &quot;데이터의 30%밖에 설명 못한다&quot;는 뜻이에요.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 하지만 R&amp;sup2; 만 믿으면 안 돼요&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;많은 사람들이 R&amp;sup2; 를 &quot;높을수록 무조건 좋은 모델&quot;로 오해해요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그건 절반만 맞는 말이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어, 변수를 아무거나 계속 넣으면 R&amp;sup2;는 무조건 올라갑니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 설명력이 진짜 올라간 건 아닙니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 &lt;b&gt;보정된 결정계수(Adjusted R&amp;sup2;)라는&lt;/b&gt; 개념이 나왔어요.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;269&quot; data-origin-height=&quot;60&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/mVEt9/dJMcain8tmV/XlY0KrBmyQVSqJ7E2OJVgK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/mVEt9/dJMcain8tmV/XlY0KrBmyQVSqJ7E2OJVgK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/mVEt9/dJMcain8tmV/XlY0KrBmyQVSqJ7E2OJVgK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FmVEt9%2FdJMcain8tmV%2FXlY0KrBmyQVSqJ7E2OJVgK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;269&quot; height=&quot;60&quot; data-origin-width=&quot;269&quot; data-origin-height=&quot;60&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;기호&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;n&lt;/td&gt;
&lt;td&gt;표본 개수&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;k&lt;/td&gt;
&lt;td&gt;독립변수 개수&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;보정된 R&amp;sup2;는 변수가 늘어나면 페널티를 줍니다.&lt;br /&gt;즉, 진짜 설명력이 올라간 경우에만 함께 상승하죠.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 잔차(residual)란 무엇인가?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모델은 예측값(y^)을 만들어냅니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 현실의 값(Y)은 그 예측과 항상 조금 다릅니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;111&quot; data-origin-height=&quot;34&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/cOJyzc/dJMcabP45rj/xyGjoGTA7GDXNWo2ZQFQt1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/cOJyzc/dJMcabP45rj/xyGjoGTA7GDXNWo2ZQFQt1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/cOJyzc/dJMcabP45rj/xyGjoGTA7GDXNWo2ZQFQt1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FcOJyzc%2FdJMcabP45rj%2FxyGjoGTA7GDXNWo2ZQFQt1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;111&quot; height=&quot;34&quot; data-origin-width=&quot;111&quot; data-origin-height=&quot;34&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 &lt;span&gt;ei가 바로 &lt;b&gt;잔차(residual)&lt;/b&gt;입니다.&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;잔차는 &quot;모델이 틀린 정도&quot;를 의미해요.&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;상황&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;해석&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;잔차가 작음&lt;/td&gt;
&lt;td&gt;예측이 잘 맞음&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;잔차가 큼&lt;/td&gt;
&lt;td&gt;모델이 못 맞춤&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;잔차가 일정한 패턴&lt;/td&gt;
&lt;td&gt;모델 구조에 문제 있음&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 잔차는 '남은 이야기'를 들려준다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;잔차를 그래프로 그려보면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;X축에는 예측값(y^), Y축에는 잔차(e)가 찍힙니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;좋은 회귀모형이라면 이렇게 보여야 해요.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;잔차가 &lt;b&gt;0을 중심으로 랜덤 하게 흩어져 있음&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;어떤 규칙적인 패턴도 없음&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;반대로 이런 모양이면 경고예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;잔차 패턴&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;곡선 형태&lt;/td&gt;
&lt;td&gt;비선형 관계를 직선으로 억지로 맞춤&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;점점 넓어짐&lt;/td&gt;
&lt;td&gt;분산이 일정하지 않음 (이분산성)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;특정 구간만 위/아래&lt;/td&gt;
&lt;td&gt;누락된 변수나 상호작용 있음&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;즉, 잔차는 &quot;모델이 놓친 부분&quot;을 시각적으로 보여주는 거예요.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 자동차 예시로 보자&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자동차의 &lt;b&gt;연비 예측 모델&lt;/b&gt;에서 잔차를 분석해 보면:&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;경차, 소형차 구간 : 잔차가 대부분 0 근처 -&amp;gt; 잘 맞음&lt;/li&gt;
&lt;li&gt;SUV 구간 : 잔차가 음수로 큼 -&amp;gt; 실제 연비가 예측보다 훨씬 낮음&lt;/li&gt;
&lt;li&gt;스포츠카 구간 : 잔차가 양수 -&amp;gt; 예측보다 연비가 좋음&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 모델이 &quot;고성능 차량의 특성&quot;을 반영하지 못한 거예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 걸 보고 우리는 모델을 개선하죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;(예: 엔진 형식, 공기저항, 구동방식 등 변수를 추가)&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 잔차 분석은 '모델 점검표'다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;점검 항목&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 이상적인 모습&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 문제 시 조치&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;잔차 평균&lt;/td&gt;
&lt;td&gt;0 근처&lt;/td&gt;
&lt;td&gt;회귀식 재확인&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;분포 형태&lt;/td&gt;
&lt;td&gt;대칭적&lt;/td&gt;
&lt;td&gt;비선형 항 추가&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;분산 패턴&lt;/td&gt;
&lt;td&gt;일정함&lt;/td&gt;
&lt;td&gt;로그변환&amp;middot;이분산 보정&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;이상치 존재&lt;/td&gt;
&lt;td&gt;거의 없음&lt;/td&gt;
&lt;td&gt;영향력 점검 (Cook&amp;rsquo;s D 등)&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;좋은 모델은 R&amp;sup2;가 높고,&lt;br /&gt;나쁜 모델은 잔차가 특이점이 많습니다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;9. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 핵심 포인트&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;R&amp;sup2;&lt;/td&gt;
&lt;td&gt;모델이 데이터를 얼마나 설명하는가&lt;/td&gt;
&lt;td&gt;1에 가까울수록 설명력 &amp;uarr;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;보정된 R&amp;sup2;&lt;/td&gt;
&lt;td&gt;불필요한 변수에 페널티 적용&lt;/td&gt;
&lt;td&gt;다중회귀에 필수&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;잔차&lt;/td&gt;
&lt;td&gt;모델의 예측 오차&lt;/td&gt;
&lt;td&gt;패턴이 없어야 정상&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;잔차 분석&lt;/td&gt;
&lt;td&gt;모델의 문제 진단&lt;/td&gt;
&lt;td&gt;비선형&amp;middot;이분산&amp;middot;이상치 점검&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>R2</category>
      <category>결정계수</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>모델진단</category>
      <category>보정</category>
      <category>잔차</category>
      <category>잔차분석</category>
      <category>회귀분석</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/472</guid>
      <comments>https://allensdatablog.tistory.com/entry/16-%EA%B2%B0%EC%A0%95%EA%B3%84%EC%88%98R%C2%B2%EC%99%80-%EC%9E%94%EC%B0%A8-%EB%AA%A8%EB%8D%B8%EC%9D%B4-%EC%96%BC%EB%A7%88%EB%82%98-%EC%9E%98-%EB%A7%9E%EC%95%98%EC%9D%84%EA%B9%8C#entry472comment</comments>
      <pubDate>Tue, 20 Jan 2026 11:49:52 +0900</pubDate>
    </item>
    <item>
      <title>15. 회귀계수의 의미 - 단순한 숫자에서 '통계적 근거'로</title>
      <link>https://allensdatablog.tistory.com/entry/15-%ED%9A%8C%EA%B7%80%EA%B3%84%EC%88%98%EC%9D%98-%EC%9D%98%EB%AF%B8-%EB%8B%A8%EC%88%9C%ED%95%9C-%EC%88%AB%EC%9E%90%EC%97%90%EC%84%9C-%ED%86%B5%EA%B3%84%EC%A0%81-%EA%B7%BC%EA%B1%B0%EB%A1%9C</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bYSk0E/dJMcaawRESA/JQTKgBAWB9fDFdYIMyBdSk/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bYSk0E/dJMcaawRESA/JQTKgBAWB9fDFdYIMyBdSk/img.png&quot; data-alt=&quot;회귀계수&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bYSk0E/dJMcaawRESA/JQTKgBAWB9fDFdYIMyBdSk/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbYSk0E%2FdJMcaawRESA%2FJQTKgBAWB9fDFdYIMyBdSk%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;589&quot; height=&quot;589&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;회귀계수&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 회귀계수, 단순한 기울기일까?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;지난 글에서 이런 식을 봤죠:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p style=&quot;text-align: center;&quot; data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;Y&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;^ &lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;= &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;28.5 &lt;/span&gt;&lt;span&gt;&amp;minus; &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;0.006&lt;/span&gt;&lt;span&gt;&lt;span&gt;X₁ &lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&amp;minus; &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;0.003&lt;/span&gt;&lt;span&gt;&lt;span&gt;X&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;₂ &lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;+ &lt;/span&gt;&lt;/span&gt;&lt;/b&gt;&lt;span&gt;&lt;b&gt;&lt;span&gt;1.2&lt;/span&gt;&lt;/b&gt;&lt;span&gt;&lt;b&gt;&lt;span&gt;X&lt;/span&gt;&lt;/b&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;b&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;₃ &lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/b&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;​이때,&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;X₁&amp;nbsp;: 차량 무게(kg)&lt;/li&gt;
&lt;li&gt;X₂ : 엔진 배기량 (cc)&lt;/li&gt;
&lt;li&gt;X₃ : 변속기 (자동 = 1, 수동 = 0)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;여기서 숫자들(-0.006, -0.003, +1.2)이 바로 &lt;b&gt;회귀계수(&amp;beta;)&lt;/b&gt; 입니다.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;단순히 &quot;기울기&quot;지만, 실제로는 더 중요한 의미가 있어요.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;b&gt; &amp;beta;₁ = 다른 조건이 같을 때 X₁ 이 Y에 미치는 평균적 영향.&lt;/b&gt;&lt;br /&gt;즉, &quot;차량 무게가 1kg 늘면 연비가 평균적으로 얼마나 줄어드는가?&quot;를 말해줍니다.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이걸 &lt;b&gt;부분표과(partial effect)&lt;/b&gt;라고 불러요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;다중회귀에서는 &quot;나머지 변수들이 고정되어 있을 때&quot;라는 조건이 항상 붙습니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;2. 그런데... 이 &amp;beta;₁이 '진짜'일까?&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;데이터에는 항상 변동(노이즈)이 있죠.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;그래서 &amp;beta;₁ = -0.006이라는 값도 표본에 따라 조금씩 달라집니다.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;이 말은 곧,&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;우리가 구한 계수는 모집단의 진짜 영향력을 근사한 것&quot;&lt;br /&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;이라는 뜻이에요.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;그럼 이 값을 신뢰할 수 있는지 검증해야겠죠?&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;여기서 &lt;b&gt;신뢰구간(confidence interval)&lt;/b&gt;과 &lt;b&gt;t검정(t-test)&lt;/b&gt;이 등장합니다.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h2 data-ke-size=&quot;size26&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;3. 신뢰구간 : 우리가 믿는 범위&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/h2&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;예를 들어,&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&quot;차량 무게가 1kg 늘 때 연비가 0.006km/L 줄어든다.&quot;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;이 결과의 &lt;b&gt;95% 신뢰구간&lt;/b&gt;이 [-0.009, -0.003]이라면 이렇게 해석합니다:&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;진짜 효과는 -0.009와 -0.003 사이 어딘가에 있을 것이다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;즉, 이 범위 안에서는 확실히 음의 관계(-)죠.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;-&amp;gt; &lt;b&gt;무게가 늘면 연비는 확실히 줄어든다&lt;/b&gt;고 말할 수 있습니다.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;만약 신뢰구간이 [-0.005, +0.002]라면?&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;0이 포함돼요.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;즉, &quot;연비가 줄어드는지, 아닌지 확실하지 않다.&quot;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;-&amp;gt; 통계적으로 유의하지 않다는 뜻입니다.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;4. t검정: 관계의 '유의성'을 묻다&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;회귀계수 &amp;beta;의 t검정 공식은 다음과 같습니다.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;108&quot; data-origin-height=&quot;65&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/cPOTvz/dJMcajm2pDn/RaX4vmVshz2hKibiCaR1i0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/cPOTvz/dJMcajm2pDn/RaX4vmVshz2hKibiCaR1i0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/cPOTvz/dJMcajm2pDn/RaX4vmVshz2hKibiCaR1i0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FcPOTvz%2FdJMcajm2pDn%2FRaX4vmVshz2hKibiCaR1i0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;108&quot; height=&quot;65&quot; data-origin-width=&quot;108&quot; data-origin-height=&quot;65&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;항목&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;span&gt;&amp;beta;^i&lt;/span&gt;&lt;/td&gt;
&lt;td&gt;추정된 회귀계수&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;span&gt;SE&lt;/span&gt;&lt;span&gt;(&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&amp;beta;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;^i&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;)&lt;/span&gt;&lt;/td&gt;
&lt;td&gt;그 계수의 표준오차 (불확실성)&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;이 t값이 크면 -&amp;gt; &amp;beta;가 0일 가능성이 매우 낮음 -&amp;gt; &lt;b&gt;유의하다&lt;/b&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;보통 기준은 p &amp;lt; 0.05, 즉 5% 이하의 확률만 허용합니다.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;요약하면:&lt;br /&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;t값이 크고, 신뢰구간이 0을 포함하지 않으면&lt;br /&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;-&amp;gt; &quot;이 변수는 결과에 유의미한 영향을 준다.&quot;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h2 data-ke-size=&quot;size26&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;5. 실제 예시로 직관 잡기&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/h2&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;자동차 연비 분석 결과가 아래처럼 나왔다고 합시다.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;변수&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;계수(&amp;beta;̂)&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;표준오차&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; t값&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;p값&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 95% 신뢰구간&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;절편&lt;/td&gt;
&lt;td&gt;28.5&lt;/td&gt;
&lt;td&gt;1.2&lt;/td&gt;
&lt;td&gt;23.7&lt;/td&gt;
&lt;td&gt;0.000&lt;/td&gt;
&lt;td&gt;[26.1, 30.9]&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;무게&lt;/td&gt;
&lt;td&gt;&amp;minus;0.006&lt;/td&gt;
&lt;td&gt;0.002&lt;/td&gt;
&lt;td&gt;&amp;minus;3.0&lt;/td&gt;
&lt;td&gt;0.004&lt;/td&gt;
&lt;td&gt;[&amp;minus;0.010, &amp;minus;0.002]&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;배기량&lt;/td&gt;
&lt;td&gt;&amp;minus;0.003&lt;/td&gt;
&lt;td&gt;0.0015&lt;/td&gt;
&lt;td&gt;&amp;minus;2.0&lt;/td&gt;
&lt;td&gt;0.048&lt;/td&gt;
&lt;td&gt;[&amp;minus;0.006, &amp;minus;0.0001]&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;변속기&lt;/td&gt;
&lt;td&gt;+1.2&lt;/td&gt;
&lt;td&gt;0.5&lt;/td&gt;
&lt;td&gt;2.4&lt;/td&gt;
&lt;td&gt;0.018&lt;/td&gt;
&lt;td&gt;[0.2, 2.2]&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;해석은 아래와 같이 하면 됩니다&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;무게 : p = 0.004 &amp;lt; 0.05 -&amp;gt; 유의함.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; -&amp;gt; 무거워질수록 연비 감소 확실.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;배기량 : 경계선 수준 (p&amp;asymp;0.048).&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; -&amp;gt; 영향은 있지만 강하지 않음.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;변속기 : 자동일수록 연비 상승 ( 확실한 양의 효과).&lt;/li&gt;
&lt;li&gt;절편 : 의미 없음.(무게 0kg 자동차는 없으니까요.)&lt;/li&gt;
&lt;/ul&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;6. 신뢰구간 vs 유의성 - 같은 말을 다르게 보는 법&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;관점&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;기준&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 해석 방식&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;t검정/p값&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;p &amp;lt; 0.05&lt;/td&gt;
&lt;td&gt;&amp;ldquo;효과가 통계적으로 유의하다&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;신뢰구간&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;0 포함 여부&lt;/td&gt;
&lt;td&gt;&amp;ldquo;효과의 방향이 확실하다&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;둘 다 결국 &quot;이 효과가 진짜인가?&quot;를 묻습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;다만 신뢰구간은 숫자 범위로, t검정은 확률(p값)로 말하는 것뿐이에요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 왜 이런 검증이 중요한가&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀계수 하나하나가 &quot;변수의 영향력&quot;을 말한다면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;t검정과 신뢰구간은 &quot;그 영향력이 믿을 만한가&quot;를 말합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, &lt;b&gt;&quot;숫자&quot;가 아니라 &quot;근거&quot;를 보는 과정이에요.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 바로 데이터 분석과 단순 통계의 차이죠.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 현실 예시: 품질 개선 프로젝트&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자동차 도장 공정에서 도막 두께(Y)에 영향을 주는 요인을 분석했습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;Y^ &lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;= &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;20.3 &lt;/span&gt;&lt;span&gt;+ &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;0.6&lt;/span&gt;&lt;span&gt;&lt;span&gt;X&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;₁&lt;/span&gt;&lt;/span&gt;&lt;/span&gt; &lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&amp;minus; &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;0.8&lt;/span&gt;&lt;span&gt;&lt;span&gt;X&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;₂&lt;/span&gt;&lt;/span&gt;&lt;/span&gt; &lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&amp;nbsp;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;+ &lt;/span&gt;&lt;/span&gt;&lt;/b&gt;&lt;span&gt;&lt;b&gt;&lt;span&gt;0.2&lt;/span&gt;&lt;/b&gt;&lt;span&gt;&lt;b&gt;&lt;span&gt;X&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;₃&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt; &lt;/span&gt;&lt;/b&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;변수&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;설명&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;결과&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 해석&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;X₁&lt;/td&gt;
&lt;td&gt;스프레이 압력&lt;/td&gt;
&lt;td&gt;p=0.001&lt;/td&gt;
&lt;td&gt;압력 높을수록 도막 두꺼워짐&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;X₂&lt;/td&gt;
&lt;td&gt;도료 점도&lt;/td&gt;
&lt;td&gt;p=0.000&lt;/td&gt;
&lt;td&gt;점도 높을수록 도막 얇아짐&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;X₃&lt;/td&gt;
&lt;td&gt;작업자 숙련도&lt;/td&gt;
&lt;td&gt;p=0.32&lt;/td&gt;
&lt;td&gt;유의하지 않음 (작업자 간 차이 작음)&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;-&amp;gt; 공정 개선은 압력, 점도 조절에 집중해야 함을 보여줍니다.&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;9. 한 장 요약&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 해석 기준&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;회귀계수 &amp;beta;&lt;/td&gt;
&lt;td&gt;X가 Y에 주는 영향력&lt;/td&gt;
&lt;td&gt;부호(+, &amp;minus;)와 크기&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;표준오차 SE&lt;/td&gt;
&lt;td&gt;계수의 불확실성&lt;/td&gt;
&lt;td&gt;작을수록 신뢰도 높음&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;t검정&lt;/td&gt;
&lt;td&gt;&amp;ldquo;이 효과가 0이 아닐까?&amp;rdquo;&lt;/td&gt;
&lt;td&gt;p &amp;lt; 0.05면 유의&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;신뢰구간&lt;/td&gt;
&lt;td&gt;효과의 범위&lt;/td&gt;
&lt;td&gt;0 포함 여부 확인&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;결론&lt;/td&gt;
&lt;td&gt;관계의 강도 + 확실성&lt;/td&gt;
&lt;td&gt;둘 다 봐야 진짜 해석 가능&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;&quot;회귀계수는 관계를 수치로 보여주고,&lt;br /&gt;&lt;/span&gt;신뢰구간은 그 관계를 믿을 수 있는 범위로 보여줍니다.&quot;&lt;/blockquote&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>t검정</category>
      <category>기울기</category>
      <category>기초통계학</category>
      <category>단순회귀</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>신뢰구간</category>
      <category>통계</category>
      <category>회귀계수</category>
      <category>회귀분석</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/471</guid>
      <comments>https://allensdatablog.tistory.com/entry/15-%ED%9A%8C%EA%B7%80%EA%B3%84%EC%88%98%EC%9D%98-%EC%9D%98%EB%AF%B8-%EB%8B%A8%EC%88%9C%ED%95%9C-%EC%88%AB%EC%9E%90%EC%97%90%EC%84%9C-%ED%86%B5%EA%B3%84%EC%A0%81-%EA%B7%BC%EA%B1%B0%EB%A1%9C#entry471comment</comments>
      <pubDate>Sat, 17 Jan 2026 11:40:57 +0900</pubDate>
    </item>
    <item>
      <title>14. 회귀분석 - 관계를 수식으로 읽는 방</title>
      <link>https://allensdatablog.tistory.com/entry/14-%ED%9A%8C%EA%B7%80%EB%B6%84%EC%84%9D-%EA%B4%80%EA%B3%84%EB%A5%BC-%EC%88%98%EC%8B%9D%EC%9C%BC%EB%A1%9C-%EC%9D%BD%EB%8A%94-%EB%B0%A9</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1536&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/cAc144/dJMcabCw4pi/ZM1NrHCoYEbLhA8MkPIPOK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/cAc144/dJMcabCw4pi/ZM1NrHCoYEbLhA8MkPIPOK/img.png&quot; data-alt=&quot;회귀분석&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/cAc144/dJMcabCw4pi/ZM1NrHCoYEbLhA8MkPIPOK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FcAc144%2FdJMcabCw4pi%2FZM1NrHCoYEbLhA8MkPIPOK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;488&quot; height=&quot;732&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1536&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;회귀분석&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 데이터는 &quot;관계&quot;를 말한다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차 회사에서 이런 질문이 나올 수 있습니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;차량 무게가 연비에 영향을 주는가?&quot;&lt;br /&gt;&quot;엔진 크기가 커질수록 CO2 배출량이 많아지는가?&quot;&lt;br /&gt;&quot;시속이 높을수록 제동거리가 얼마나 길어지는가?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 질문들은 전부 &quot;&lt;b&gt;한 변수가 다른 변수에 어떤 영향을 미치는가&quot;&lt;/b&gt;를 묻는 형태예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 문제를 정량적으로 풀어내는 게 바로 회귀분석입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 회귀의 기본 구조&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가장 기본형, &lt;b&gt;단순회귀(Simple Regression)&lt;/b&gt;의 식은 이렇게 생겼습니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;157&quot; data-origin-height=&quot;42&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/NokVV/dJMcajN6qjd/W2QZDTPtdolbSBoo0kISaK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/NokVV/dJMcajN6qjd/W2QZDTPtdolbSBoo0kISaK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/NokVV/dJMcajN6qjd/W2QZDTPtdolbSBoo0kISaK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FNokVV%2FdJMcajN6qjd%2FW2QZDTPtdolbSBoo0kISaK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;157&quot; height=&quot;42&quot; data-origin-width=&quot;157&quot; data-origin-height=&quot;42&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;기호&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td style=&quot;width: 23.2558%;&quot;&gt;Y&lt;/td&gt;
&lt;td style=&quot;width: 76.6279%;&quot;&gt;종속변수 (결과, 예: 연비)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td style=&quot;width: 23.2558%;&quot;&gt;X&lt;/td&gt;
&lt;td style=&quot;width: 76.6279%;&quot;&gt;독립변수 (원인, 예: 차량 무게)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td style=&quot;width: 23.2558%;&quot;&gt;&lt;span&gt;&amp;beta;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;0&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/td&gt;
&lt;td style=&quot;width: 76.6279%;&quot;&gt;절편 &amp;mdash; X=0일 때 Y값&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td style=&quot;width: 23.2558%;&quot;&gt;&lt;span&gt;&amp;beta;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;1&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/td&gt;
&lt;td style=&quot;width: 76.6279%;&quot;&gt;기울기(회귀계수) &amp;mdash; X가 1단위 변할 때 Y의 변화량&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td style=&quot;width: 23.2558%;&quot;&gt;&amp;epsilon;&lt;/td&gt;
&lt;td style=&quot;width: 76.6279%;&quot;&gt;오차(예측 불가능한 요인)&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 자동차의 연비(Y)는&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;'차량 무게(X)'라는 설명 변수와 '예측 불가능한 요소(&amp;epsilon;)'로 구성된다는 뜻이에요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 기울기의 의미를 직관으로 보자&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 회귀식이 이렇게 나왔다고 해봅시다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;Y^ &lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;= &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;22 &lt;/span&gt;&lt;span&gt;&amp;minus; &lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;0.005&lt;/span&gt;&lt;span&gt;X&amp;nbsp;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;X : 차량 무게(kg)&lt;/li&gt;
&lt;li&gt;Y : 연비(km/L)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 말은 곧,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;차량이 100kg 무거워질 때마다 연비가 약 0.5km/L 줄어든다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, &lt;b&gt;기울기(&amp;beta;₁)&lt;/b&gt;가 음수면 -&amp;gt; 반비례 관계&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;양수면 -&amp;gt; 정비례 관계를 의미합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. '선' 하나로 세상을 설명할 수 있을까?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래프를 생각해 보죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가로축에 '차량 무게', 세로축에 '연비'를 찍으면 점들이 흩어집니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀분석은 그 점들 사이를 가장 잘 통과하는 '선'을 찾는 과정이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이때 '가장 잘 맞는다'의 기준은 &lt;b&gt;오차 제곱의 합이 최소가 되도록 하는 것,&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;바로 &lt;b&gt;최소제곱법(OLS, Ordinary Least Squares)입니다.&lt;/b&gt;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;180&quot; data-origin-height=&quot;40&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/buGnej/dJMcahCKzyX/7VFnsnxOlpEO54unyERed1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/buGnej/dJMcahCKzyX/7VFnsnxOlpEO54unyERed1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/buGnej/dJMcahCKzyX/7VFnsnxOlpEO54unyERed1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbuGnej%2FdJMcahCKzyX%2F7VFnsnxOlpEO54unyERed1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;180&quot; height=&quot;40&quot; data-origin-width=&quot;180&quot; data-origin-height=&quot;40&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;쉽게 말하면,&lt;br /&gt;모든 점들과 선의 거리(예측 오차)를 가능한 한 작게 만드는 선을 찾는 것.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 오차(&amp;epsilon;)의 의미 - 현실이 완벽하지 않다는 사실&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;현실의 데이터는 완벽히 일직선 위에 있지 않아요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;연비는 차량 무게 외에도 엔진 효율, 공기저항, 타이어 상태 등 여러 요인에 영향을 받죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 &lt;b&gt;설명되지 않는 부분&lt;/b&gt;을 모두 &lt;b&gt;오 차 항(&amp;epsilon;)이&lt;/b&gt; 담당합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 회귀식은 &quot;완벽한 예측&quot;이 아니라 &quot;최선의 근사값&quot;을 제공합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 단순회귀 vs 다중회귀&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;구분&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 형태&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;예시&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;단순회귀&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;Y = &amp;beta;₀ + &amp;beta;₁X&lt;/td&gt;
&lt;td&gt;연비 ~ 차량무게&lt;/td&gt;
&lt;td&gt;변수 하나의 영향&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;다중회귀&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;Y = &amp;beta;₀ + &amp;beta;₁X₁ + &amp;beta;₂X₂ + ...&lt;/td&gt;
&lt;td&gt;연비 ~ 차량무게 + 엔진배기량 + 타이어마찰계수&lt;/td&gt;
&lt;td&gt;여러 요인의 동시 영향&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;즉, 다중회귀는 &quot;&lt;b&gt;복합적인 현실을 설명하는 선형 모델&quot;&lt;/b&gt;이에요.&lt;br /&gt;자동차의 연비는 단 하나의 요인으로 결정되지 않으니까요.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 회귀계수의 해석 팁&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt;단위&lt;/b&gt;에 항상 주의하세요.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 예: 차량 무게(kg) vs 연비(km/L) -&amp;gt; &amp;beta;₁ 단위는 &quot;km/L per kg&quot;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt;절편 &amp;beta;₀&lt;/b&gt;은 의미가 없는 경우도 많아요.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;(예: 차량 무게 0kg의 연비는 현실적으로 의미가 없죠.)&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt; &amp;beta;₁의 부호와 크기&lt;/b&gt;는 인과 방향과 영향력 크기를 직관적으로 보여줍니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 모델의 적합도 : 얼마나 잘 맞았을까?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;회귀식이 데이터를 잘 설명하는지 평가하는 지표가 &lt;b&gt;결정계수(R&amp;sup2;)&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;221&quot; data-origin-height=&quot;64&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bINzE0/dJMcabier2U/dKxEIaV1l8SdYfkOJWTWd1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bINzE0/dJMcabier2U/dKxEIaV1l8SdYfkOJWTWd1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bINzE0/dJMcabier2U/dKxEIaV1l8SdYfkOJWTWd1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbINzE0%2FdJMcabier2U%2FdKxEIaV1l8SdYfkOJWTWd1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;221&quot; height=&quot;64&quot; data-origin-width=&quot;221&quot; data-origin-height=&quot;64&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;R&amp;sup2; = 0.8 -&amp;gt; &quot;이 모델이 데이터를 80% 설명한다.&quot;&lt;/li&gt;
&lt;li&gt;R&amp;sup2; = 0 -&amp;gt; &quot;설명력 거의 없음.&quot;&lt;/li&gt;
&lt;/ul&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;R&amp;sup2;가 높다고 무조건 좋은 모델은 아닙니다.&lt;br /&gt;너무 많은 변수를 넣으면 R&amp;sup2;는 무조건 올라가요.&lt;br /&gt;그래서 보정된 R&amp;sup2;(Adjusted R&amp;sup2;)도 함께 봅니다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;9. 실무 예시로 정리해 보자&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;자동차 회사의 엔진 효율 분석 예시&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;목적 : 연비(Y)에 영향을 주는 주요 요인 파악&lt;/li&gt;
&lt;li&gt;변수 : 차량 무게(X₁), 엔진 배기량(X₂), 변속기 종류(X₃)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결과가 이렇게 나왔다고 합시다;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size18&quot;&gt;&lt;b&gt; &lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;Y&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;^&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;=&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;28.5&lt;/span&gt;&lt;span&gt;&amp;minus;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;0.006&lt;/span&gt;&lt;span&gt;&lt;span&gt;X&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;1&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&amp;minus;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;0.003&lt;/span&gt;&lt;span&gt;&lt;span&gt;X&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;2&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;+&lt;/span&gt;&lt;/span&gt;&lt;/b&gt;&lt;span&gt;&lt;b&gt;&lt;span&gt;1&lt;/span&gt;&lt;/b&gt;&lt;span&gt;&lt;b&gt;&lt;span&gt;X&lt;/span&gt;&lt;/b&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;b&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;3&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/b&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;차량이 무거울수록 연비 하락&lt;/li&gt;
&lt;li&gt;배기량이 커질수록 연비 하락&lt;/li&gt;
&lt;li&gt;자동변속기(1) 일 때 수동(0)보다 연비 상승&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 이 모델은 &quot;차가 가벼울수록, 엔진이 작을수록, 자동변속기일수록 연비가 높다&quot;는 결론을 주는 거예요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;10. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;포인트&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;회귀분석&lt;/td&gt;
&lt;td&gt;변수 간 관계를 수식으로 표현&lt;/td&gt;
&lt;td&gt;&amp;lsquo;관계의 언어&amp;rsquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;기울기 &amp;beta;₁&lt;/td&gt;
&lt;td&gt;X가 1 증가할 때 Y의 변화량&lt;/td&gt;
&lt;td&gt;영향력 크기&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;절편 &amp;beta;₀&lt;/td&gt;
&lt;td&gt;X=0일 때 Y의 예측값&lt;/td&gt;
&lt;td&gt;맥락 따라 무의미할 수도&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;오차 &amp;epsilon;&lt;/td&gt;
&lt;td&gt;예측 불가능한 요인&lt;/td&gt;
&lt;td&gt;현실의 불완전성&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;결정계수 R&amp;sup2;&lt;/td&gt;
&lt;td&gt;모델의 설명력&lt;/td&gt;
&lt;td&gt;높을수록 잘 맞음 (단, 과적합 주의)&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;&quot;상관은 관계를 보여주지만,&lt;br /&gt;&lt;/span&gt;회귀는 그 관계를 '얼마나'인지를 말해줍니다.&quot;&lt;/blockquote&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>r제곱</category>
      <category>기울기</category>
      <category>기초통계학</category>
      <category>다중회귀</category>
      <category>단순회귀</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>최소제곱법</category>
      <category>통계</category>
      <category>회귀분석</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/470</guid>
      <comments>https://allensdatablog.tistory.com/entry/14-%ED%9A%8C%EA%B7%80%EB%B6%84%EC%84%9D-%EA%B4%80%EA%B3%84%EB%A5%BC-%EC%88%98%EC%8B%9D%EC%9C%BC%EB%A1%9C-%EC%9D%BD%EB%8A%94-%EB%B0%A9#entry470comment</comments>
      <pubDate>Wed, 14 Jan 2026 09:24:14 +0900</pubDate>
    </item>
    <item>
      <title>13. 분산분석(ANOVA) - 평균을 비교하는데 왜 분산을 볼까?</title>
      <link>https://allensdatablog.tistory.com/entry/13-%EB%B6%84%EC%82%B0%EB%B6%84%EC%84%9DANOVA-%ED%8F%89%EA%B7%A0%EC%9D%84-%EB%B9%84%EA%B5%90%ED%95%98%EB%8A%94%EB%8D%B0-%EC%99%9C-%EB%B6%84%EC%82%B0%EC%9D%84-%EB%B3%BC%EA%B9%8C</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bwIWkc/dJMcahpc6fy/OJHGTpc1A6gCXdd4fus5K0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bwIWkc/dJMcahpc6fy/OJHGTpc1A6gCXdd4fus5K0/img.png&quot; data-alt=&quot;분산분석&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bwIWkc/dJMcahpc6fy/OJHGTpc1A6gCXdd4fus5K0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbwIWkc%2FdJMcahpc6fy%2FOJHGTpc1A6gCXdd4fus5K0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;575&quot; height=&quot;575&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;분산분석&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 세 집단의 평균을 비교하고 싶은 순간&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 봅시다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;한 업체에서 세 가지 부품 코팅 방식(A, B, C)을 테스트했다고 해요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;각 부품의 &lt;b&gt;내구 시간(단위: 시간)&lt;/b&gt;을 측정했죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결과를 요약하면 아래와 같아요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;코팅&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 평균 수명(시간)&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;A&lt;/td&gt;
&lt;td&gt;3100&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;B&lt;/td&gt;
&lt;td&gt;3150&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;C&lt;/td&gt;
&lt;td&gt;3300&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자, 질문은 간단합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;이 차이가 진짜 의미 있는 걸까,&lt;br /&gt;아니면 샘플이 우연히 이렇게 나온 걸까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;여기서 &lt;b&gt;세 집단의 평균을 한 번에 비교&lt;/b&gt;하는 게&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;바로 &lt;b&gt;분산분석(ANOVA)&lt;/b&gt;입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 그런데 왜 '분산'을 보냐구요?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;좋은 질문입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이름부터 '분산분석'이니까 혼란스럽죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;근데 그 이유는 간단합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;평균의 차이를 보려면,&lt;br /&gt;먼저 각 그룹이 얼마나 흩어져 있는지(분산)를 봐야 하기 때문이에요.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;쉽게 말해,&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;그룹 간 평균이 멀리 떨어져 있고&lt;/li&gt;
&lt;li&gt;그룹 내부의 값들이 고르게 몰려 있다면&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt;&quot;차이가 진짜로 있다&quot;라고 보는 거예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;반대로&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;각 그룹 평균은 조금 다르지만&lt;/li&gt;
&lt;li&gt;그룹 내부 값들이 들쭉날쭉하다면&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt;&quot;이건 우연일 수도 있다&quot;는 거죠.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 분산분석의 핵심 아이디어&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;ANOVA는 데이터를 이렇게 쪼개서 봅니다.&lt;/p&gt;
&lt;h4 data-ke-size=&quot;size20&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;전체 변동 = 집단 간 변동 + 집단 내 변동&lt;/h4&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;변동 종류&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;뜻&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;집단 간 변동&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;평균들 간의 차이&lt;/td&gt;
&lt;td&gt;코팅 A, B, C가 다를까?&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;집단 내 변동&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;각 그룹 내부의 분산&lt;/td&gt;
&lt;td&gt;같은 코팅 내 부품 간 차이&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 두 변동의 비율이 바로 &lt;b&gt;F값&lt;/b&gt;이에요.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;152&quot; data-origin-height=&quot;65&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/Tv97j/dJMcahCKfMc/YaI59MaTqM7Ec1PxvKVfr0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/Tv97j/dJMcahCKfMc/YaI59MaTqM7Ec1PxvKVfr0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/Tv97j/dJMcahCKfMc/YaI59MaTqM7Ec1PxvKVfr0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FTv97j%2FdJMcahCKfMc%2FYaI59MaTqM7Ec1PxvKVfr0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;152&quot; height=&quot;65&quot; data-origin-width=&quot;152&quot; data-origin-height=&quot;65&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;F가 1이면 -&amp;gt; 그룹 간 차이가 거의 없음&lt;/li&gt;
&lt;li&gt;F가 커질수록 -&amp;gt; 그룹 간 차이가 큼 (우연 아님)&lt;/li&gt;
&lt;/ul&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 예시로 직관 잡기&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;세 코팅 A, B, C의 내구 시간 데이터를 시각적으로 보죠.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt;상황 1&lt;/b&gt; : A, B, C 평균이 거의 같고 흩어짐도 큼 -&amp;gt; &quot;차이 없다&quot;&lt;/li&gt;
&lt;li&gt;&lt;b&gt; 상황 2&lt;/b&gt; : A, B, C 평균이 확실히 다르고 각 그룹은 일정 -&amp;gt; &quot;차이 있다&quot;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 분산분석은 &quot;평균 간 차이를 분산의 언어로 번역해서 비교하는&quot; 도구예요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. F값이 크면, 그 다음은?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;F검정으로 &quot;세 그룹 중 적어도 하나는 다르다&quot;는 걸 알 수 있어요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 &quot;누가 누구랑 다르냐?&quot;는 모릅니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 그 다음엔 &lt;b&gt;사후검정(Post-hoc test)&lt;/b&gt;을 합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;Turkey HSD, Scheff&amp;eacute;, Bonferroni 등&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; -&amp;gt;&quot;B와 C가 유의하게 다르다&quot; 같은 결론을 내줍니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 요약으로 딱 잡기&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;포인트&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;설명&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;목적&lt;/td&gt;
&lt;td&gt;세 집단 이상 평균 비교&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;왜 분산을 보나&lt;/td&gt;
&lt;td&gt;평균 차이를 분산의 비율로 판단하기 때문&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;F값&lt;/td&gt;
&lt;td&gt;집단 간 분산 &amp;divide; 집단 내 분산&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;해석&lt;/td&gt;
&lt;td&gt;F&amp;uarr; &amp;rarr; 차이 있음, F&amp;asymp;1 &amp;rarr; 차이 없음&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;후속 절차&lt;/td&gt;
&lt;td&gt;사후검정으로 구체 비교&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 실무 예시&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1. 공정 개선 실험&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;세 가지 기계 설정 온도에서 출력률 차이 있는가?&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp;-&amp;gt; 일원분산분석(One-way ANOVA)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;2. 교육 프로그램 효과 측정&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;세 가지 교육법이 평균 성적에 영향을 주는가?&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp;-&amp;gt; 일원분산분석 + 사후검정&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;3. 광고 캠페인 실험&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;세 가지 광고 카피의 전환율 차이 있는가?&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp;-&amp;gt; 비율 기반 ANOVA 또는 변환 후 적용&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 마지막으로&lt;/h3&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;분산분석은 평균의 대결을 공정하게 만드는 심판이에요.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;t검정은 두 집단까지만 비교하지만,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;ANOVA는 세 집단 이상을 한꺼번에 다뤄요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 실험 설계나 데이터 분석의 &quot;기본 무기&quot;로 쓰이는 거죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>ANOVA</category>
      <category>F검정</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>분산분석</category>
      <category>사후검정</category>
      <category>일원분산분석</category>
      <category>통계</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/469</guid>
      <comments>https://allensdatablog.tistory.com/entry/13-%EB%B6%84%EC%82%B0%EB%B6%84%EC%84%9DANOVA-%ED%8F%89%EA%B7%A0%EC%9D%84-%EB%B9%84%EA%B5%90%ED%95%98%EB%8A%94%EB%8D%B0-%EC%99%9C-%EB%B6%84%EC%82%B0%EC%9D%84-%EB%B3%BC%EA%B9%8C#entry469comment</comments>
      <pubDate>Sun, 11 Jan 2026 09:23:58 +0900</pubDate>
    </item>
    <item>
      <title>12. Z, t, &amp;chi;&amp;sup2;, F - 언제 어떤 검정을 써야 할까?</title>
      <link>https://allensdatablog.tistory.com/entry/12-Z-t-%CF%87%C2%B2-F-%EC%96%B8%EC%A0%9C-%EC%96%B4%EB%96%A4-%EA%B2%80%EC%A0%95%EC%9D%84-%EC%8D%A8%EC%95%BC-%ED%95%A0%EA%B9%8C</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bLW4KR/dJMcagRmdDx/XOoz8AWc3Ec9MUTdrjNkE0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bLW4KR/dJMcagRmdDx/XOoz8AWc3Ec9MUTdrjNkE0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bLW4KR/dJMcagRmdDx/XOoz8AWc3Ec9MUTdrjNkE0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbLW4KR%2FdJMcagRmdDx%2FXOoz8AWc3Ec9MUTdrjNkE0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;466&quot; height=&quot;466&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 가설검정의 본질은 &quot;비교&quot;입니다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;통계 검정은 결국 이런 질문을 던지는 일입니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;이 차이가 우연일까, 진짜일까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;여기서 &lt;b&gt;무엇을 비교하느냐, 데이터가 어떤 형태냐,&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;모르는 게 무엇이냐(분산?평균?)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 세 가지에 따라 검정법이 달라집니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 네 가지 검정의 큰 그림&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;검정 종류&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;비교 대상&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;데이터 형태&amp;nbsp; 분산 정보&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 주요 사용 상황&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;Z검정&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;평균&lt;/td&gt;
&lt;td&gt;연속형&lt;/td&gt;
&lt;td&gt;&amp;sigma;(모집단 분산) &lt;b&gt;알고 있음&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;큰 표본, 표준정규 기반&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;t검정&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;평균&lt;/td&gt;
&lt;td&gt;연속형&lt;/td&gt;
&lt;td&gt;&amp;sigma; &lt;b&gt;모름&lt;/b&gt; (표본분산 사용)&lt;/td&gt;
&lt;td&gt;대부분의 실무 비교&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;&amp;chi;&amp;sup2;검정 (카이제곱)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;비율&amp;middot;빈도&lt;/td&gt;
&lt;td&gt;범주형&lt;/td&gt;
&lt;td&gt;&amp;mdash;&lt;/td&gt;
&lt;td&gt;범주형 독립성&amp;middot;적합도&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;F검정&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;분산&lt;/td&gt;
&lt;td&gt;연속형&lt;/td&gt;
&lt;td&gt;&amp;mdash;&lt;/td&gt;
&lt;td&gt;분산 비교, ANOVA의 기반&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. Z vs t - 같은 평균 비교, 다른 전제&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1. Z검정&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt;모집단 분산 &amp;sigma;&amp;sup2;을 알고 있음&lt;/b&gt; (또는 표본이 매우 큼, n&amp;ge;30)&lt;/li&gt;
&lt;li&gt;표본평균의 분포를 &lt;b&gt;정규분포&lt;/b&gt;로 근사&lt;/li&gt;
&lt;/ul&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;106&quot; data-origin-height=&quot;58&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/PHe1c/dJMcaiIphEq/gHLPSNOaDScI8VPkiq06Ck/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/PHe1c/dJMcaiIphEq/gHLPSNOaDScI8VPkiq06Ck/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/PHe1c/dJMcaiIphEq/gHLPSNOaDScI8VPkiq06Ck/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FPHe1c%2FdJMcaiIphEq%2FgHLPSNOaDScI8VPkiq06Ck%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;106&quot; height=&quot;58&quot; data-origin-width=&quot;106&quot; data-origin-height=&quot;58&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예: &quot;공장에서 생산된 볼트의 평균 길이가 500mm인가?&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; &amp;sigma;가 사전에 파악된 공정이라면 Z검정 사용.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;2. t검정&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&amp;sigma;를 모르고, 표본분산 s&amp;sup2;으로 추정&lt;/li&gt;
&lt;li&gt;자유도(df)에 따라 &lt;b&gt;t분포&lt;/b&gt; 사용&lt;/li&gt;
&lt;/ul&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;108&quot; data-origin-height=&quot;64&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/5YVsb/dJMcabWOKiN/7qgd3kgicA51K9Kcq628gk/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/5YVsb/dJMcabWOKiN/7qgd3kgicA51K9Kcq628gk/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/5YVsb/dJMcabWOKiN/7qgd3kgicA51K9Kcq628gk/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2F5YVsb%2FdJMcabWOKiN%2F7qgd3kgicA51K9Kcq628gk%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;108&quot; height=&quot;64&quot; data-origin-width=&quot;108&quot; data-origin-height=&quot;64&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예: &quot;새 공정의 평균 수명이 기존과 다른가?&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;-&amp;gt; 실험 샘플만 있고 전체 분산은 모를 때 -&amp;gt; t검정.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;현실의 대부분은 &quot; &amp;sigma;를 모르는 상황&quot; -&amp;gt;&lt;b&gt; t검정이 기본값&lt;/b&gt;입니다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. t검정의 세 가지 형태&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;검정 형태&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 비교 상황&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 예시&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;단일표본 t검정&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;표본평균 vs 특정값&lt;/td&gt;
&lt;td&gt;&amp;ldquo;A부품 평균 강도는 200 이상인가?&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;독립표본 t검정&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;두 집단 평균 비교&lt;/td&gt;
&lt;td&gt;&amp;ldquo;A팀과 B팀의 생산성 차이&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;대응표본 t검정&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;한 집단의 전&amp;middot;후 비교&lt;/td&gt;
&lt;td&gt;&amp;ldquo;시제품 개선 전후 성능 변화&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;독립표본은 서로 다른 그룹, 대응표본은 같은 대상의 변화입니다.&lt;br /&gt;예를 들어 트랙터 테스트 전후 데이터 -&amp;gt; 대응표본.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. &amp;chi;&amp;sup2; 검정 - 비율, 빈도의 싸움&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;성별에 따라 불량률이 다를까?&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;예상한 분포와 실제 빈도가 다를까?&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 건 평균이 아니라 비율/빈도의 문제예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;167&quot; data-origin-height=&quot;62&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bGKwZa/dJMcabWOKkh/iFWEweUGetV0eVfdfMGOr1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bGKwZa/dJMcabWOKkh/iFWEweUGetV0eVfdfMGOr1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bGKwZa/dJMcabWOKkh/iFWEweUGetV0eVfdfMGOr1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbGKwZa%2FdJMcabWOKkh%2FiFWEweUGetV0eVfdfMGOr1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;167&quot; height=&quot;62&quot; data-origin-width=&quot;167&quot; data-origin-height=&quot;62&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;검정 형태&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 예시&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;적합도 검정&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;기대빈도와 실제빈도 비교&lt;/td&gt;
&lt;td&gt;&amp;ldquo;지역별 구매비율이 예측과 같은가?&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;독립성 검정&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;두 범주 변수의 관계&lt;/td&gt;
&lt;td&gt;&amp;ldquo;성별과 구매 여부가 독립인가?&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;p값이 작으면 -&amp;gt; &quot;기대한 비율과 다르다&quot;, &quot;독립이 아니다&quot;.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;범주형 데이터에서는 &amp;chi;&amp;sup2;가기본 언어입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. F검정 - 분산을 비교하는 문&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;F검정은 두 분산의 비율을 보는 방법입니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;91&quot; data-origin-height=&quot;68&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/SErAr/dJMcac2uDfA/Io9YLFU3rnMueIKcEyvbK0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/SErAr/dJMcac2uDfA/Io9YLFU3rnMueIKcEyvbK0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/SErAr/dJMcac2uDfA/Io9YLFU3rnMueIKcEyvbK0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FSErAr%2FdJMcac2uDfA%2FIo9YLFU3rnMueIKcEyvbK0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;91&quot; height=&quot;68&quot; data-origin-width=&quot;91&quot; data-origin-height=&quot;68&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;F값이 1에 가까우면 -&amp;gt; 두 집단 분산이 유사&lt;/li&gt;
&lt;li&gt;크게 벗어나면 -&amp;gt; &quot;분산이 다르다&quot;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;F검정은 단독으로도 쓰지만, ANOVA(분산분석)의 핵심 엔진이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, &quot;세 집단 이상의 평균 비교&quot;도 결국 F검정을 통해 이뤄집니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 현실에서의 조합 예시&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;상황&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 사용 검정&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;이유&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;새 공정의 평균 길이가 50mm인가?&lt;/td&gt;
&lt;td&gt;단일표본 t (또는 Z)&lt;/td&gt;
&lt;td&gt;평균 비교&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;두 기계의 출력이 다르다&lt;/td&gt;
&lt;td&gt;독립표본 t&lt;/td&gt;
&lt;td&gt;두 집단 비교&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;개선 전후 출력 차이&lt;/td&gt;
&lt;td&gt;대응표본 t&lt;/td&gt;
&lt;td&gt;같은 대상 전후&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;남녀에 따라 고장 유형 다름&lt;/td&gt;
&lt;td&gt;&amp;chi;&amp;sup2; 독립성&lt;/td&gt;
&lt;td&gt;범주형 관계&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;세 종류의 재료 평균 강도 비교&lt;/td&gt;
&lt;td&gt;ANOVA (F검정 기반)&lt;/td&gt;
&lt;td&gt;3집단 이상 평균 비교&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;Z와 t는 &quot;평균의 세계&quot;,&lt;br /&gt;&lt;/span&gt; &amp;chi;&amp;sup2; 와&amp;nbsp; F는 &quot;비율과 분산의 세계&quot;.&lt;br /&gt;어떤 데이터를 다루는지 알면, 검정은 반쯤 끝난 셈이에요.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>ANOVA</category>
      <category>F검정</category>
      <category>t검정</category>
      <category>Z검정</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>카이제곱검정</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/468</guid>
      <comments>https://allensdatablog.tistory.com/entry/12-Z-t-%CF%87%C2%B2-F-%EC%96%B8%EC%A0%9C-%EC%96%B4%EB%96%A4-%EA%B2%80%EC%A0%95%EC%9D%84-%EC%8D%A8%EC%95%BC-%ED%95%A0%EA%B9%8C#entry468comment</comments>
      <pubDate>Thu, 8 Jan 2026 10:32:20 +0900</pubDate>
    </item>
    <item>
      <title>11. 1&amp;middot;2종 오류와 검정력 - 틀리지 않기 위한 설계의 기술</title>
      <link>https://allensdatablog.tistory.com/entry/11-1%C2%B72%EC%A2%85-%EC%98%A4%EB%A5%98%EC%99%80-%EA%B2%80%EC%A0%95%EB%A0%A5-%ED%8B%80%EB%A6%AC%EC%A7%80-%EC%95%8A%EA%B8%B0-%EC%9C%84%ED%95%9C-%EC%84%A4%EA%B3%84%EC%9D%98-%EA%B8%B0%EC%88%A0</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/YfAqL/dJMcajge5Tt/9SvvNEkZfSQc1qgVD492c1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/YfAqL/dJMcajge5Tt/9SvvNEkZfSQc1qgVD492c1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/YfAqL/dJMcajge5Tt/9SvvNEkZfSQc1qgVD492c1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FYfAqL%2FdJMcajge5Tt%2F9SvvNEkZfSQc1qgVD492c1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;600&quot; height=&quot;600&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;&amp;nbsp;&lt;/h3&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 두 가지 실수부터 정확히 잡고 가자&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가설검정은 H₀(차이 없음)를 기본값으로 두고 시작합니다. 여기서 생길 수 있는 실수:&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;실제&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;우리의 판단&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;결과&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;H₀ 참(진짜 차이 없음)&lt;/td&gt;
&lt;td&gt;기각&lt;/td&gt;
&lt;td&gt;&lt;b&gt;1종 오류 (&amp;alpha;)&lt;/b&gt; &amp;mdash; 우연을 진짜로 착각&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;H₀ 거짓(진짜 차이 있음)&lt;/td&gt;
&lt;td&gt;기각 못 함&lt;/td&gt;
&lt;td&gt;&lt;b&gt;2종 오류 (&amp;beta;)&lt;/b&gt; &amp;mdash; 진짜를 놓침&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt;유의수준 &amp;alpha;:&lt;/b&gt; 1종 오류를 허용하는 최대 확률(보통 0.05).&lt;/li&gt;
&lt;li&gt;&lt;b&gt;검정력 Power = 1 - &amp;beta;:&lt;/b&gt; 진짜 차이가 있을 때 잡아낼 확률.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; -&amp;gt; 파워가 0.8(80%)면, &quot;있으면 10번 중 8번 잡는다&quot;는 뜻.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;핵심: &amp;alpha;를 너무 낮추면(엄격) 1종 오류는 줄지만, 2종 오류(&amp;beta;)가 늘어 파워가 떨어집니다. 반대로 &amp;alpha;를 높이면(느슨) 파워는 오르지만 1종 오류 위험이 커집니다. &lt;b&gt;트레이드오프&lt;/b&gt;입니다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 검정력을 키우는 네 가지 레버&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1. 표본크기 n&amp;uarr; &amp;rarr; Power&amp;uarr; &lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp;표준오차가 줄어 차이를 더 잘 구분.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;2. 효과크기(Effect size) &amp;uarr; -&amp;gt; Power &amp;uarr; &lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp;차이가 클수록 잡아내기 쉬움. (예: 평균 차이 1.0 vs 0.2)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;3. 변동성 &amp;sigma;&amp;darr; -&amp;gt; Power&amp;uarr; &lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp;데이터가 덜 흔들리면 신호/노이즈 비가 좋아짐. (측정 정밀도/분산 감소)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;4. 유의 수준 &amp;alpha; &amp;darr; -&amp;gt; Power &amp;uarr; &lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp;임계값이 느슨해져 검정 통과가 쉬워짐. (대신 1종 오류 &amp;uarr;)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;실무 팁 : n과 분산은 우리가 직접 손댈 수 있는 레버입니다.&lt;br /&gt;더 많은 표본, 더 일관된 측정(노이즈 줄이기)이 파워를 올리는 가장 안전한 방법.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 두 상황으로 감 잡기&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;A. 품질개선 : 불량률 2% -&amp;gt; 1.5%로 낮췄는지 검정&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;H₀: p = 0.02, H₁: p &amp;lt; 0.02&lt;/li&gt;
&lt;li&gt;알파 0.05, 목표 파워 0.8로 설계하려면?&lt;br /&gt;대략적인 필요 표본 수(비율 비교 러프 공식):&lt;/li&gt;
&lt;/ul&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;351&quot; data-origin-height=&quot;64&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/dgmfNG/dJMcadAknXe/EYra1YKyQuXvJJH1KaBwGK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/dgmfNG/dJMcadAknXe/EYra1YKyQuXvJJH1KaBwGK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/dgmfNG/dJMcadAknXe/EYra1YKyQuXvJJH1KaBwGK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FdgmfNG%2FdJMcadAknXe%2FEYra1YKyQuXvJJH1KaBwGK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;351&quot; height=&quot;64&quot; data-origin-width=&quot;351&quot; data-origin-height=&quot;64&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;p0=0.02,  p1=0.015,  z0.95&amp;asymp;1.645,  z0.8&amp;asymp;0.84p_0=0.02,\; p_1=0.015,\; z_{0.95}\approx1.645,\; z_{0.8}\approx0.84&lt;span aria-hidden=&quot;true&quot;&gt;p0​=0.02,p1​=0.015,z0.95​&amp;asymp;1.645,z0.8​&amp;asymp;0.84&lt;/span&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span aria-hidden=&quot;true&quot;&gt;&lt;span&gt;&lt;span&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;-&amp;gt; 대략 수천 단위 표본이 표본이 필요(희소 사건의 작은 개선은 큰 n을 요구).&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;메시지: 작은 개선(효과크기 &lt;b&gt;&amp;darr;&lt;/b&gt;) + 드문 사건(p 작음)일수록 &lt;b&gt;n 폭증.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;B. A/B 테스트 전환율 5.0% vs 5.6%&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;차이 0.6%p는 작아 보이지만, 상대 12% 상승.&lt;/li&gt;
&lt;li&gt;전형적 세팅(&amp;alpha;=0.05, 파워 0.8)에서 양군 동일 n일 때,&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 전환율 5~6%대 비교는 수천~만 단위 노출이 흔합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;메시지:&lt;/b&gt; 마케팅 개선은 보통 소효과 -&amp;gt; 표본 많이 필요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 효과크기를 숫자로 말하기 (감각 고정)&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;평균 비교(t-test): &lt;span aria-hidden=&quot;true&quot;&gt;d=&amp;sigma;&amp;mu;1​&amp;minus;&amp;mu;2 / ​​&lt;/span&gt; (Cohen&amp;rsquo;s d)
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;d&amp;asymp;0.2(작음), 0.5(중간), 0.8(큼) &amp;mdash; 대략 감&lt;/li&gt;
&lt;/ul&gt;
&lt;/li&gt;
&lt;li&gt;비율 비교: 절대 차이(&amp;Delta;p)와 오즈비(OR)를 함께 보되, 보고서에는 신뢰구간을 꼭 병기.&lt;/li&gt;
&lt;/ul&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;효과크기를 먼저 가늠하면, 파워 계산이 현실적인지 빨리 판단할 수 있습니다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 양측 vs 단측 검정, 그리고 파워&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt; 양측(&amp;ne;):&lt;/b&gt; 양쪽 꼬리를 다 본다 -&amp;gt; 임계값이 더 엄격 -&amp;gt; 같은 n에서 &lt;b&gt;파워 &amp;darr; &lt;/b&gt;&lt;/li&gt;
&lt;li&gt;&lt;b&gt;단측(&amp;gt;,&amp;lt;):&lt;/b&gt; 한쪽만 본다 -&amp;gt; 임계값 느슨 -&amp;gt; &lt;b&gt;파워 &amp;uarr; &lt;/b&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;단, &lt;b&gt;단측은 사전 가정이 명확하고 반대 방향 결과엔 관심이 없을 때만&lt;/b&gt; 사용.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;보고서에 검정 방향을 분명히 명기하세요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 표본크기 산정, 최소 체크리스트&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1. 효과크기 가정 :&lt;/b&gt; 비지니스/엔지니어링적으로 의미 있는 최소 차이(MID) 정의&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;2. 변동성 추정:&lt;/b&gt; 과거 데이터로 &amp;sigma; 또는 p(1-p) 추정&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;3. &amp;alpha;, 파워 설정:&lt;/b&gt; 보통 &amp;alpha;=0.05, 파워 &amp;gt;=0.8(품질/의료는 0.9도 고려)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;4. 손실/누락률 고려:&lt;/b&gt; 실험 누락, 결측 대비 10~20% 여유&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;5. 현실 제약 반영:&lt;/b&gt; 기간, 비용, 샘플링 가능성&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;파워가 너무 낮으면, &quot;차이가 없음&quot;이 아니라 &quot;검출 능력이 부족&quot;일 수 있습니다. 보고서에 파워를 함께 제시하세요.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 최소 공식 두 개 (현업 감각용 러프 버전)&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;평균 차이(등분산 가정, 양군 동일 n)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;평균 차이(등분산 가정, 양군 동일 n)&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;202&quot; data-origin-height=&quot;69&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/dFsfrt/dJMcahQgnfx/rz81CGryj5wxMKVR7Plsq1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/dFsfrt/dJMcahQgnfx/rz81CGryj5wxMKVR7Plsq1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/dFsfrt/dJMcahQgnfx/rz81CGryj5wxMKVR7Plsq1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FdFsfrt%2FdJMcahQgnfx%2Frz81CGryj5wxMKVR7Plsq1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;202&quot; height=&quot;69&quot; data-origin-width=&quot;202&quot; data-origin-height=&quot;69&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;Delta;: 탐지하고 싶은 평균 차이, &amp;sigma;:표준편차&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;비율 차이(양군 동일 n)&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;454&quot; data-origin-height=&quot;69&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/zwBSV/dJMcafZdntv/D4IsiqrGD4INN6EbJUpeW0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/zwBSV/dJMcafZdntv/D4IsiqrGD4INN6EbJUpeW0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/zwBSV/dJMcafZdntv/D4IsiqrGD4INN6EbJUpeW0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FzwBSV%2FdJMcafZdntv%2FD4IsiqrGD4INN6EbJUpeW0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;454&quot; height=&quot;69&quot; data-origin-width=&quot;454&quot; data-origin-height=&quot;69&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;p&amp;circ; = (p1 + p2) / 2&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;정확한 설계는 전문 도구(G*Power, statsmodels 등)로 검증하시고, 위 식은 초기 견적/감 잡기에 쓰세요.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 보고서에 이렇게 쓰면 깔끔하다&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&quot;유의수준 0.05, 양측 검정.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp;예상 효과크기 d=0.4, 목표 파워 0.8 기준 필요한 표본 수는 각 군 98명.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp;결측 10% 감안해 각 군 110명 모집 예정.&quot;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;결과: &quot;p=0.03, 효과크기 d=0.41, 95% CI [0.10, 0.72].&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp;통계적으로 유의하며, 실무 임계치(&amp;gt;=0.3)도 충족.&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;포인트&lt;/b&gt; : p값, 효과크기, 신뢰구간, 파워/표본 설계 근거 - 네 세트를 한 번에.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;9. 한 장 요약&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt; &amp;alpha;(1종) vs &amp;beta;(2종):&lt;/b&gt; 한쪽을 줄이면 다른 쪽이 늘어난다.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;POWER = 1- &amp;beta;:&lt;/b&gt; 진짜 차이가 있을 때 잡아낼 확률. 보통 0.8 이상.&lt;/li&gt;
&lt;li&gt;파워 올리는 법: &lt;b&gt;n&amp;uarr;, 효과크기&amp;uarr;, &amp;sigma;&amp;darr;, &amp;alpha;&amp;uarr;(주의), 단측 검정(조건부).&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;&lt;b&gt;효과크기 가정&lt;/b&gt;과 &lt;b&gt;표본크기 산정&lt;/b&gt;이 설계의 핵심.&lt;/li&gt;
&lt;li&gt;결과 보고는 &lt;b&gt;p값, 효과크기 + 신뢰구간 + 설계&lt;/b&gt; 요약으로 완성.&lt;/li&gt;
&lt;/ul&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;가설검정은 &quot;있다/없다&quot;를 누르는 버튼이 아닙니다.&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;틀릴 가능성을 관리하는 설계의 기술이에요.&lt;/span&gt;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>1종오류</category>
      <category>2종오류</category>
      <category>검정력</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>유의수준</category>
      <category>통계</category>
      <category>표본크기</category>
      <category>효과크기</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/467</guid>
      <comments>https://allensdatablog.tistory.com/entry/11-1%C2%B72%EC%A2%85-%EC%98%A4%EB%A5%98%EC%99%80-%EA%B2%80%EC%A0%95%EB%A0%A5-%ED%8B%80%EB%A6%AC%EC%A7%80-%EC%95%8A%EA%B8%B0-%EC%9C%84%ED%95%9C-%EC%84%A4%EA%B3%84%EC%9D%98-%EA%B8%B0%EC%88%A0#entry467comment</comments>
      <pubDate>Mon, 5 Jan 2026 17:34:34 +0900</pubDate>
    </item>
    <item>
      <title>10. 유의수준과 가설검정 - 우연과 진짜의 경계</title>
      <link>https://allensdatablog.tistory.com/entry/10-%EC%9C%A0%EC%9D%98%EC%88%98%EC%A4%80%EA%B3%BC-%EA%B0%80%EC%84%A4%EA%B2%80%EC%A0%95-%EC%9A%B0%EC%97%B0%EA%B3%BC-%EC%A7%84%EC%A7%9C%EC%9D%98-%EA%B2%BD%EA%B3%84</link>
      <description>&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. &quot;이 차이는 우연일까, 진짜일까?&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자동차 부품 A와 B의 내구성을 비교한다고 해볼게요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;A 는 평균 3,000시간, B는 평균 3,100시간.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;100시간 차이가 납니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이제 질문은 하나예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;이 차이가 진짜 성능 차이일까,&lt;br /&gt;아니면 우연히 생긴 오차일까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 판단을 돕는 절차가 바로 &lt;b&gt;가설검정(Hypothesis Testing)&lt;/b&gt; 입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 가설검정의 기본 구조&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모든 가설검정은 두 가지 가정에서 시작합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;구분&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 이름&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;귀무가설 (H₀)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;Null Hypothesis&lt;/td&gt;
&lt;td&gt;&amp;ldquo;차이가 없다&amp;rdquo;는 기본 입장&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;대립가설 (H₁)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;Alternative Hypothesis&lt;/td&gt;
&lt;td&gt;&amp;ldquo;차이가 있다&amp;rdquo;는 주장&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;H₀: A와 B의 평균 수명은 같다 (&amp;mu;A = &amp;mu;B)&lt;br /&gt;H₁: A와 B의 평균 수명은 다르다 (&amp;mu;A &amp;ne; &amp;mu;B)&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가설검정은 이 &lt;b&gt;H₀를 일단 참이라고 가정&lt;/b&gt;하고,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;데이터가 그 논리를 부술 만큼 강력한 근거를 주는지 확인하는 절차예요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 유의수준(&amp;alpha;)의 의미&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;유의수준은 &lt;b&gt;우연을 받아들일 한계선&lt;/b&gt;이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가장 많이 쓰는 기준은 &amp;alpha; = 0.05 (5%).&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;데이터가 이렇게 극단적인 확률이 5%보다 작다면,&lt;br /&gt;단순한 우연으로 보기 어렵다 -&amp;gt; H₀를 기각한다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;유의수준&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 해석&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;0.10&lt;/td&gt;
&lt;td&gt;비교적 느슨함 (탐색적 연구)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;0.05&lt;/td&gt;
&lt;td&gt;일반적 기준&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;0.01&lt;/td&gt;
&lt;td&gt;매우 엄격한 기준 (의학, 품질 등)&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. p-value, 숫자에 담긴 메시지&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;p-value는 &quot;데이터가 이렇게 나올 확률&quot;이에요.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;귀무가설이 참이라면, 이런 결과(또는 더 극단적인 결과)가 우연히 날 확률이 얼마나 될까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;p-value&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;해석&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&amp;lt; 0.05&lt;/td&gt;
&lt;td&gt;우연으로 보기 어렵다 &amp;rarr; H₀ 기각&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&amp;ge; 0.05&lt;/td&gt;
&lt;td&gt;우연일 수 있다 &amp;rarr; H₀ 유지(기각 못 함)&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어, p=0.03이면?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;이 결과가 우연히 생길 확률은 3%밖에 안 되니까, 진짜 차이일 가능성이 높다.&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;p-value는 &quot;확률&quot;이 아니라 &quot;증거의 강도&quot;예요.&lt;br /&gt;작을수록 귀무가설을 흔드는 힘이 강하다는 뜻이죠.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 오류의 두 얼굴: 1종과 2종&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가설검정은 완벽하지 않아요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;두 가지 종류의 실수를 저지를 수 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;구분&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;설명&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;결과&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;1종 오류 (Type I)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;사실은 H₀가 맞는데 기각함&lt;/td&gt;
&lt;td&gt;&amp;ldquo;우연인데 차이 있다고 착각&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;2종 오류 (Type II)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;사실은 H₀가 틀렸는데 기각 못 함&lt;/td&gt;
&lt;td&gt;&amp;ldquo;진짜 차이인데 눈치 못 챔&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;유의수준 &amp;alpha;는 &lt;b&gt;1종 오류를 허용하는 최대 확률&lt;/b&gt;이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, &quot;우연을 진짜라고 착각할 확률을 5%까지만 허용하겠다&quot;는 뜻이죠.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 실제 예시로 보는 가설검정&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;예시 1. 신제품 부품 내구성 테스트&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1851&quot; data-start=&quot;1825&quot;&gt;H₀: 신제품의 평균 수명 = 기존 제품&lt;/li&gt;
&lt;li data-end=&quot;1878&quot; data-start=&quot;1852&quot;&gt;H₁: 신제품의 평균 수명 &amp;gt; 기존 제품&lt;/li&gt;
&lt;li data-end=&quot;1944&quot; data-start=&quot;1879&quot;&gt;실험 결과 p=0.02 &amp;rarr; 0.05보다 작음&lt;br /&gt;&amp;rarr; &lt;b&gt;H₀ 기각, 신제품이 통계적으로 더 오래간다고 판단&lt;/b&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;예시 2. 마케팅 A/B테스트&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1992&quot; data-start=&quot;1971&quot;&gt;H₀: 두 광고의 클릭률은 같다&lt;/li&gt;
&lt;li data-end=&quot;2004&quot; data-start=&quot;1993&quot;&gt;H₁: 다르다&lt;/li&gt;
&lt;li data-end=&quot;2065&quot; data-start=&quot;2005&quot;&gt;p=0.13 &amp;rarr; 0.05보다 큼&lt;br /&gt;&amp;rarr; &lt;b&gt;H₀ 기각 불가&lt;/b&gt;, 즉 &amp;ldquo;확실히 다르다고는 말 못 함.&amp;rdquo;&lt;/li&gt;
&lt;/ul&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;통계적 유의미함(statistical significance) &amp;ne; 실제 중요성(practical significance)&lt;br /&gt;-&amp;gt; p값이 작다고 해서 비지니스 임팩트가 크다는 뜻은 아니에요.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 시각적으로 이해하기&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;정규분포 곡선 아래의 꼬리 부분이 유의수준(&amp;alpha;)&lt;/li&gt;
&lt;li&gt;p-value는 실제 데이터가 어느 쪽까지 밀려났는지를 나타냄&lt;/li&gt;
&lt;li&gt;p가 &amp;alpha;보다 작으면 &quot;귀무가설 구역&quot;을 벗어남 -&amp;gt; 기각&lt;/li&gt;
&lt;li&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/uAfsR/dJMcagcKaYN/YCnULhXLAZz4P3mCBqQIF1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/uAfsR/dJMcagcKaYN/YCnULhXLAZz4P3mCBqQIF1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/uAfsR/dJMcagcKaYN/YCnULhXLAZz4P3mCBqQIF1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FuAfsR%2FdJMcagcKaYN%2FYCnULhXLAZz4P3mCBqQIF1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;609&quot; height=&quot;609&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/li&gt;
&lt;/ul&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 설명&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 핵심 포인트&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;귀무가설 (H₀)&lt;/td&gt;
&lt;td&gt;차이가 없다&lt;/td&gt;
&lt;td&gt;기본 입장&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;대립가설 (H₁)&lt;/td&gt;
&lt;td&gt;차이가 있다&lt;/td&gt;
&lt;td&gt;우리가 검증하고 싶은 주장&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;유의수준 (&amp;alpha;)&lt;/td&gt;
&lt;td&gt;우연을 허용하는 기준&lt;/td&gt;
&lt;td&gt;보통 0.05&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;p-value&lt;/td&gt;
&lt;td&gt;데이터가 이렇게 나올 확률&lt;/td&gt;
&lt;td&gt;작을수록 H₀가 흔들림&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;1종 오류&lt;/td&gt;
&lt;td&gt;H₀ 참인데 기각&lt;/td&gt;
&lt;td&gt;&amp;ldquo;우연을 진짜로 착각&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;2종 오류&lt;/td&gt;
&lt;td&gt;H₀ 거짓인데 유지&lt;/td&gt;
&lt;td&gt;&amp;ldquo;진짜를 못 알아봄&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;&quot;가설검정은 정답을 찾는 게 아니라,&lt;br /&gt;&lt;/span&gt;'데이터가 말이 되는가'를 묻는 과정이에요.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>p값</category>
      <category>가설검정</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>유의수준</category>
      <category>통계</category>
      <category>통계적유의성</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/466</guid>
      <comments>https://allensdatablog.tistory.com/entry/10-%EC%9C%A0%EC%9D%98%EC%88%98%EC%A4%80%EA%B3%BC-%EA%B0%80%EC%84%A4%EA%B2%80%EC%A0%95-%EC%9A%B0%EC%97%B0%EA%B3%BC-%EC%A7%84%EC%A7%9C%EC%9D%98-%EA%B2%BD%EA%B3%84#entry466comment</comments>
      <pubDate>Thu, 1 Jan 2026 10:21:40 +0900</pubDate>
    </item>
    <item>
      <title>9. 점추정과 구간추정 - 숫자 하나에 담긴 '불확실함의 크기'</title>
      <link>https://allensdatablog.tistory.com/entry/9-%EC%A0%90%EC%B6%94%EC%A0%95%EA%B3%BC-%EA%B5%AC%EA%B0%84%EC%B6%94%EC%A0%95-%EC%88%AB%EC%9E%90-%ED%95%98%EB%82%98%EC%97%90-%EB%8B%B4%EA%B8%B4-%EB%B6%88%ED%99%95%EC%8B%A4%ED%95%A8%EC%9D%98-%ED%81%AC%EA%B8%B0</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bXMCkj/dJMcain5FFc/NBpv4Y3riOEjfEXH7xf9h0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bXMCkj/dJMcain5FFc/NBpv4Y3riOEjfEXH7xf9h0/img.png&quot; data-alt=&quot;신뢰구간&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bXMCkj/dJMcain5FFc/NBpv4Y3riOEjfEXH7xf9h0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbXMCkj%2FdJMcain5FFc%2FNBpv4Y3riOEjfEXH7xf9h0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;450&quot; height=&quot;450&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;신뢰구간&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;&amp;nbsp;&lt;/h3&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 우리는 결국 &quot;모집단&quot;을 직접 볼 수 없습니다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;통계학의 출발점은 늘 똑같아요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;모든 데이터를 다 볼 수 없을 때,&lt;br /&gt;일부만 보고 전체를 어떻게 추론할 것인가?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어,&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;자동차 엔진 10,000대의 실제 평균 수명을 알고 싶어요.&lt;/li&gt;
&lt;li&gt;하지만 전부 테스트할 순 없으니 50대만 시험합니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그럼 우리는 이 50대의 평균으로 &lt;b&gt;모집단 평균을 '추정'&lt;/b&gt;하게 됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 바로 통계적 추론의 출발이에요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 점추정 : 숫자 하나로 대표하는 세상&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;점추정(Point Estimation)&lt;/b&gt;은 말 그대로&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모집단의 특성을 하나의 숫자로 추정하는 방법이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;모집단 특성&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;표본으로 추정하는 값&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 기호&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td style=&quot;width: 34.4186%;&quot;&gt;모집단 평균 (&amp;mu;)&lt;/td&gt;
&lt;td style=&quot;width: 44.4186%;&quot;&gt;표본 평균&lt;/td&gt;
&lt;td style=&quot;width: 20.9302%;&quot;&gt;&lt;b&gt;x̄&lt;span&gt;&amp;nbsp;&lt;/span&gt;&lt;/b&gt;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td style=&quot;width: 34.4186%;&quot;&gt;모집단 비율 (p)&lt;/td&gt;
&lt;td style=&quot;width: 44.4186%;&quot;&gt;표본 비율&lt;/td&gt;
&lt;td style=&quot;width: 20.9302%;&quot;&gt;p&amp;circ;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td style=&quot;width: 34.4186%;&quot;&gt;모집단 분산 (&amp;sigma;&amp;sup2;)&lt;/td&gt;
&lt;td style=&quot;width: 44.4186%;&quot;&gt;표본 분산&lt;/td&gt;
&lt;td style=&quot;width: 20.9302%;&quot;&gt;S&amp;sup2;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 표본평균 &lt;b&gt;x̄&lt;span&gt;&amp;nbsp;&lt;/span&gt;&lt;/b&gt; 은 모집단평균 &amp;mu;의 &lt;b&gt;점추정량(estimator)&lt;/b&gt;이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;표본이 모집단을 대신하는 하나의 대표 숫자.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어, 50대의 평균 수명이 3,150시간이라면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;우리는 &quot;엔진의 평균 수명은 약 3,150시간이다&quot;라고 말하죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 여기서 문제가 하나 생깁니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;그 숫자 하나가 얼마나 믿을 만할까?&lt;/b&gt;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 구간추정 : 불확실성을 인정하는 법&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;점추정은 깔끔하지만 불안합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표본이 다르면 평균도 달라지니까요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 통계학은 이렇게 말하죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;숫자 하나로 말하지 말고,&lt;br /&gt;믿을 수 있는 구간을 함께 제시하자.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 바로 &lt;b&gt;구간추정(Interval Estimation)&lt;/b&gt;입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가장 흔한 형태가 신뢰구간&lt;b&gt;(Confidence Interval, CI)&lt;/b&gt;이에요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 신뢰구간의 정의&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;신뢰구간은 이렇게 생겼어요.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;126&quot; data-origin-height=&quot;56&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bM5FUh/dJMcab3zsQ3/9RjcgH7yofTMoUgc8Y9aj1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bM5FUh/dJMcab3zsQ3/9RjcgH7yofTMoUgc8Y9aj1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bM5FUh/dJMcab3zsQ3/9RjcgH7yofTMoUgc8Y9aj1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbM5FUh%2FdJMcab3zsQ3%2F9RjcgH7yofTMoUgc8Y9aj1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;126&quot; height=&quot;56&quot; data-origin-width=&quot;126&quot; data-origin-height=&quot;56&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;기호&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;x̄&amp;nbsp;&amp;nbsp;&lt;/td&gt;
&lt;td&gt;표본평균&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;(Z a/2)&lt;/td&gt;
&lt;td&gt;정규분포에서의 임계값 (예: 1.96 for 95%)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;(\frac{\sigma}{\sqrt{n}})&lt;/td&gt;
&lt;td&gt;표준오차(표본평균의 불확실성)&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어,&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;표본평균 3,150시간&lt;/li&gt;
&lt;li&gt;표준편차 100시간&lt;/li&gt;
&lt;li&gt;표본 크기 50&lt;/li&gt;
&lt;li&gt;신뢰수준 95%&lt;/li&gt;
&lt;/ul&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;325&quot; data-origin-height=&quot;71&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bET1Kr/dJMcaj1Bw53/DhcTKS61BSMeoFVPjR9k5k/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bET1Kr/dJMcaj1Bw53/DhcTKS61BSMeoFVPjR9k5k/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bET1Kr/dJMcaj1Bw53/DhcTKS61BSMeoFVPjR9k5k/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbET1Kr%2FdJMcaj1Bw53%2FDhcTKS61BSMeoFVPjR9k5k%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;325&quot; height=&quot;71&quot; data-origin-width=&quot;325&quot; data-origin-height=&quot;71&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;이 엔진의 평균 수명은 3,122시간에서 3,178시간 사이에 있을 것이다.&quot;&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 신뢰수준 95%의 진짜 뜻&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;많은 사람들이 오해하는 부분이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&quot;95% 확률로 평균이 저 안에 있다&quot;&lt;/b&gt;가 아닙니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;정확한 의미는 이렇습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;이 과정을 100번 반복한다면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 중 약 95번은 진짜 평균을 포함할 것이다.&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 신뢰구간은 '단 한번의 확률'이 아니라&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;'반복적 실험에서의 안정성'을 뜻해요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 신뢰구간이 좁다는 건 좋은 신호일까?&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;보통은 맞습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;신뢰구간이 좁을수록 추정이 정확하다는 뜻이죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 폭은 다음 세 가지 요인으로 결정됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;요인&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 효과&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;이유&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;표본 크기 &amp;uarr;&lt;/td&gt;
&lt;td&gt;구간 &amp;darr;&lt;/td&gt;
&lt;td&gt;표준오차가 작아짐&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;표준편차 &amp;darr;&lt;/td&gt;
&lt;td&gt;구간 &amp;darr;&lt;/td&gt;
&lt;td&gt;데이터 일관성이 높음&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;신뢰수준 &amp;uarr;&lt;/td&gt;
&lt;td&gt;구간 &amp;uarr;&lt;/td&gt;
&lt;td&gt;더 &amp;ldquo;안전하게&amp;rdquo; 잡음&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;즉, 더 많이 보고, 일관된 데이터를 모을수록, 더 정확한 추정이 가능하다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 실무에서의 예시&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1. 제조 품질관리&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&quot;부품 길이의 평균은 50.0&amp;plusmn;0.2mm (95% 신뢰수준)&quot;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; -&amp;gt; 평균뿐 아니라 불확실성까지 명시&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;2. 고객 만족도 조사&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&quot;만족 고객 비율은 82%&amp;plusmn;3% (95% 신뢰수준)&quot;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;-&amp;gt; 표본의 불확실성을 반영&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;3. A/B테스트&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&quot;전환율 차이가 1.2%p, 95% 신뢰구간 [0.5, 1.9]&quot;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; -&amp;gt;0을 포함하지 않으면 &quot;통계적으로 유의한 차이&quot;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;설명&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 핵심 포인트&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;점추정&lt;/td&gt;
&lt;td&gt;모집단의 값을 하나의 수로 추정&lt;/td&gt;
&lt;td&gt;깔끔하지만 불확실함이 큼&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;구간추정&lt;/td&gt;
&lt;td&gt;신뢰구간으로 불확실성 표현&lt;/td&gt;
&lt;td&gt;신뢰수준과 표본크기로 결정&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;신뢰수준&lt;/td&gt;
&lt;td&gt;반복 실험에서 진짜 평균이 포함될 확률&lt;/td&gt;
&lt;td&gt;95%가 가장 일반적&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;표준오차&lt;/td&gt;
&lt;td&gt;표본평균의 변동성&lt;/td&gt;
&lt;td&gt;표본이 많을수록 작아짐&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;핵심 해석&lt;/td&gt;
&lt;td&gt;추정값 &amp;plusmn; 불확실성&lt;/td&gt;
&lt;td&gt;&amp;ldquo;숫자만 믿지 말고, 신뢰 범위를 보라.&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;&quot;통계는 '정답'을 말하지 않습니다.&lt;br /&gt;&lt;/span&gt;대신 '얼마나 믿을 만한가'를 알려주죠.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>구간추정</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>신뢰구간</category>
      <category>점추정</category>
      <category>통계</category>
      <category>표준오차</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/465</guid>
      <comments>https://allensdatablog.tistory.com/entry/9-%EC%A0%90%EC%B6%94%EC%A0%95%EA%B3%BC-%EA%B5%AC%EA%B0%84%EC%B6%94%EC%A0%95-%EC%88%AB%EC%9E%90-%ED%95%98%EB%82%98%EC%97%90-%EB%8B%B4%EA%B8%B4-%EB%B6%88%ED%99%95%EC%8B%A4%ED%95%A8%EC%9D%98-%ED%81%AC%EA%B8%B0#entry465comment</comments>
      <pubDate>Mon, 29 Dec 2025 12:28:39 +0900</pubDate>
    </item>
    <item>
      <title>7. 정규분포 - 세상의 중심으로 모이는 이유</title>
      <link>https://allensdatablog.tistory.com/entry/7-%EC%A0%95%EA%B7%9C%EB%B6%84%ED%8F%AC-%EC%84%B8%EC%83%81%EC%9D%98-%EC%A4%91%EC%8B%AC%EC%9C%BC%EB%A1%9C-%EB%AA%A8%EC%9D%B4%EB%8A%94-%EC%9D%B4%EC%9C%A0</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bb6JzT/dJMcaelGxN1/x4CcibICp8U6eknkSA0cqK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bb6JzT/dJMcaelGxN1/x4CcibICp8U6eknkSA0cqK/img.png&quot; data-alt=&quot;정규분포&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bb6JzT/dJMcaelGxN1/x4CcibICp8U6eknkSA0cqK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fbb6JzT%2FdJMcaelGxN1%2Fx4CcibICp8U6eknkSA0cqK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;518&quot; height=&quot;518&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;정규분포&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;&amp;nbsp;&lt;/h3&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 세상은 '평균 쪽으로' 기울어져 있습니다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;사람 키, 시험 점수, 자동차 엔진 수명,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;심지어 커피 한 잔의 카페인 함량까지 ㅡ&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 모든 게 놀랍도록 비슷한 모양의 그래프를 그립니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가운데가 가장 높고, 양쪽으로 갈수록 낮아지는 &lt;b&gt;종(bell) 모양의 곡선.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 바로 &lt;b&gt;정규분포&lt;/b&gt;예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;평균 근처의 일이 가장 잘 일어나고,&lt;br /&gt;너무 작거나 너무 큰 일은 드물다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 세상의 기본 패턴이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;완벽하지는 않지만, 꽤 많은 현상이 이 법칙을 따릅니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 정의는 간단하지만, 의미는 깊어요&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;정규분포의 확률밀도함수는 이렇게 생겼어요.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;186&quot; data-origin-height=&quot;63&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bdEH5x/dJMcaaDApiO/YCah7zJJzAELrTGNmGQDfk/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bdEH5x/dJMcaaDApiO/YCah7zJJzAELrTGNmGQDfk/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bdEH5x/dJMcaaDApiO/YCah7zJJzAELrTGNmGQDfk/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbdEH5x%2FdJMcaaDApiO%2FYCah7zJJzAELrTGNmGQDfk%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;186&quot; height=&quot;63&quot; data-origin-width=&quot;186&quot; data-origin-height=&quot;63&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;수식은 복잡해 보이지만, 각 부분의 의미는 명확합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;기호&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%; height: 64px;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr style=&quot;height: 18px;&quot;&gt;
&lt;td style=&quot;height: 18px;&quot;&gt;&amp;mu;&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot;&gt;평균(중심)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr style=&quot;height: 18px;&quot;&gt;
&lt;td style=&quot;height: 18px;&quot;&gt;&amp;sigma;&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot;&gt;표준편차(퍼짐 정도)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr style=&quot;height: 18px;&quot;&gt;
&lt;td style=&quot;height: 18px;&quot;&gt;e&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot;&gt;자연상수(&amp;asymp; 2.718) &amp;mdash; 곡선의 부드러움을 만듦&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;중심은 평균 &amp;mu;&lt;/li&gt;
&lt;li&gt;폭은 표준편차 &amp;sigma;&lt;/li&gt;
&lt;li&gt;확률이 떨어지는 속도든 e-거리^2&lt;/li&gt;
&lt;/ul&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;평균에서 멀어질수록 확률은 급격히 줄어든다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 68 - 95 - 99.7 법칙 : 정규분포를 감각적으로 읽는 법&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;정규분포에서 표준편차 단위로 구간을 보면 놀라운 일정함이 나옵니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;구간&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;포함 비율&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&amp;mu; &amp;plusmn; 1&amp;sigma;&lt;/td&gt;
&lt;td&gt;약 68%&lt;/td&gt;
&lt;td&gt;대부분 평균 근처&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&amp;mu; &amp;plusmn; 2&amp;sigma;&lt;/td&gt;
&lt;td&gt;약 95%&lt;/td&gt;
&lt;td&gt;거의 전체&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&amp;mu; &amp;plusmn; 3&amp;sigma;&lt;/td&gt;
&lt;td&gt;약 99.7%&lt;/td&gt;
&lt;td&gt;극단적으로 드문 일&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 사람 키가 평균 170cm, 표준편차 5cm 라면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;대부분의 사람(약 95%)은 &lt;b&gt;160~180cm&lt;/b&gt; 사이에 있어요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그보다 작거나 큰 사람은 드물죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 단순한 규칙이 &lt;b&gt;품질관리, 센서 검증, 시험 점수 평가&lt;/b&gt;까지&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;수많은 현실 문제의 근간이 됩니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 정규분포의 탄생 - 중심극한정리의 마법&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;왜 이렇게 많은 데이터가 정규분포를 따를까?&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 답은 &lt;b&gt;중심극한정리(Central Limit Theorem, CLT)&lt;/b&gt;에 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;한마디로 말하면 이렇습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;서로 다른 여러 요인의 합은,&lt;br /&gt;결국 정규분포에 가까워진다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;사람 키를 예로 들어볼게요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;키는 유전, 영양, 수면, 운동 등 수많은 작은 요인의 합이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;각 요인이 조금씩 영향을 주다 보면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결국 평균 근처로 몰리게 되죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이건 단순히 자연 현상뿐 아니라&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;데이터 분석 전반에 깔려 있는 기본 원리예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;정규분포를 세상이 복잡하다는 사실의 결과물이에요.&lt;br /&gt;여러 변수의 합은 결국 평균으로 모입니다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 표준정규분포: 모든 걸 하나의 눈금으로&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;정규분포는 평균과 표준편차가 다르기 때문에&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;서로 비교하기 어렵죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 통계에서는 &lt;b&gt;표준화(Standardization)&lt;/b&gt;를 사용합니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;106&quot; data-origin-height=&quot;60&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/xYq5D/dJMcaeTwt9v/EtatjBvk74YAWBk3p2IOGK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/xYq5D/dJMcaeTwt9v/EtatjBvk74YAWBk3p2IOGK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/xYq5D/dJMcaeTwt9v/EtatjBvk74YAWBk3p2IOGK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FxYq5D%2FdJMcaeTwt9v%2FEtatjBvk74YAWBk3p2IOGK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;106&quot; height=&quot;60&quot; data-origin-width=&quot;106&quot; data-origin-height=&quot;60&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 식을 통해 모든 데이터를 &quot;평균 0, 표준편차 1&quot;로 바꿔요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 바로 표준정규분포(Z 분포) 예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 시험 점수 85점, 평균 80점, 표준편차 5점이라면&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;149&quot; data-origin-height=&quot;63&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/DJKQS/dJMcain5kVM/LRnpDBAb1h3JvUWHNse1FK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/DJKQS/dJMcain5kVM/LRnpDBAb1h3JvUWHNse1FK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/DJKQS/dJMcain5kVM/LRnpDBAb1h3JvUWHNse1FK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FDJKQS%2FdJMcain5kVM%2FLRnpDBAb1h3JvUWHNse1FK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;149&quot; height=&quot;63&quot; data-origin-width=&quot;149&quot; data-origin-height=&quot;63&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 이 학생은 평균보다 &quot;1 표준편차&quot; 높은 위치에 있다는 뜻이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;Z값으로 바꾸면 &lt;b&gt;서로 다른 데이터의 상대적 위치를 비교&lt;/b&gt;할 수 있습니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 현실 속 정규분포&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;품질관리(QC) : 제품의 길이, 무게, 압력 값&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;-&amp;gt; 평균에서 &amp;plusmn; 3&amp;sigma; 벗어나면 불량 판정&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;교육평가 : 시험 점수의 상대적 위치(Z점수, 표준점수)&lt;/li&gt;
&lt;li&gt;금융 : 투자 수익률의 변동&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; -&amp;gt; 위험 관리의 기본 척도&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;거의 모든 데이터가 완벽한 정규분포를 따르진 않지만,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;대부분의 분석은 &quot;정규분포 근사&quot;를 기본 한정으로 둡니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 포인트&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;정규분포&lt;/td&gt;
&lt;td&gt;평균을 중심으로 좌우대칭인 종형 분포&lt;/td&gt;
&lt;td&gt;세상의 기본 패턴&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;평균 &amp;mu;&lt;/td&gt;
&lt;td&gt;중심 위치&lt;/td&gt;
&lt;td&gt;데이터의 중심&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;표준편차 &amp;sigma;&lt;/td&gt;
&lt;td&gt;폭, 변동성&lt;/td&gt;
&lt;td&gt;퍼질수록 완만해짐&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;68&amp;ndash;95&amp;ndash;99.7 법칙&lt;/td&gt;
&lt;td&gt;표준편차 기준 확률&lt;/td&gt;
&lt;td&gt;데이터의 대부분은 &amp;mu; &amp;plusmn; 2&amp;sigma; 안&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;중심극한정리&lt;/td&gt;
&lt;td&gt;여러 요인의 합 &amp;rarr; 정규분포&lt;/td&gt;
&lt;td&gt;복잡한 세상의 자연스러운 결과&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;표준정규분포&lt;/td&gt;
&lt;td&gt;&amp;mu;=0, &amp;sigma;=1&lt;/td&gt;
&lt;td&gt;비교와 계산의 기준 축&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;&quot;정규분포는 세상의 평균으로 향하는 힘을 그린 그래프예요.&lt;br /&gt;&lt;/span&gt;모든 통계가 결국 여기로 돌아옵니다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>데이터분포</category>
      <category>데이터사이언스</category>
      <category>정규분포</category>
      <category>중심극한정리</category>
      <category>통계</category>
      <category>표준정규분포</category>
      <category>표준화</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/464</guid>
      <comments>https://allensdatablog.tistory.com/entry/7-%EC%A0%95%EA%B7%9C%EB%B6%84%ED%8F%AC-%EC%84%B8%EC%83%81%EC%9D%98-%EC%A4%91%EC%8B%AC%EC%9C%BC%EB%A1%9C-%EB%AA%A8%EC%9D%B4%EB%8A%94-%EC%9D%B4%EC%9C%A0#entry464comment</comments>
      <pubDate>Sat, 27 Dec 2025 09:36:09 +0900</pubDate>
    </item>
    <item>
      <title>8.중심극한정리와 표본평균 - 불확실한 세상 속의 안정된 평균</title>
      <link>https://allensdatablog.tistory.com/entry/7%EC%A4%91%EC%8B%AC%EA%B7%B9%ED%95%9C%EC%A0%95%EB%A6%AC%EC%99%80-%ED%91%9C%EB%B3%B8%ED%8F%89%EA%B7%A0-%EB%B6%88%ED%99%95%EC%8B%A4%ED%95%9C-%EC%84%B8%EC%83%81-%EC%86%8D%EC%9D%98-%EC%95%88%EC%A0%95%EB%90%9C-%ED%8F%89%EA%B7%A0</link>
      <description>&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 표본 하나로 세상을 알 수 있을까?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;자동차 공장에서 부품 10,00개를 만들었다고 합시다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 중 몇 개만 뽑아서 평균 무게를 잴 때, 그 평균은 과연 믿을 만할까요?&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;표본 평균이 모집단 평균과 얼마나 다를까?&lt;/li&gt;
&lt;li&gt;표본을 여러 번 뽑으면 결과가 들쭉날쭉할까?&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이때 등장하는 개념이 바로 &lt;b&gt;표본평균의 분포(Sampling Distribusion of th Mean)입니다.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그리고 이걸 통계적으로 설명하는 것이 바로 중심극한정리예요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 중심극한정리, 한 문장으로 말하면&lt;/h3&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;표본을 충분히 많이 뽑아 그 평균을 구하면,&lt;br /&gt;그 평균들은 원래 분포가 어떤 모양이든 결국 정규분포를 따른다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 전부입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;정말 단순하지만, 통계학이 굴러가는 핵심 원리예요.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bfu0AE/dJMcakzqZlf/kMBvoqZUEk2fHrqpkZJ3s1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bfu0AE/dJMcakzqZlf/kMBvoqZUEk2fHrqpkZJ3s1/img.png&quot; data-alt=&quot;중심극한정리&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bfu0AE/dJMcakzqZlf/kMBvoqZUEk2fHrqpkZJ3s1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fbfu0AE%2FdJMcakzqZlf%2FkMBvoqZUEk2fHrqpkZJ3s1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;593&quot; height=&quot;593&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;중심극한정리&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 한눈에 보는 구조&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;비유&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;모집단 (Population)&lt;/td&gt;
&lt;td&gt;우리가 알고 싶은 전체&lt;/td&gt;
&lt;td&gt;공장의 모든 부품&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;표본 (Sample)&lt;/td&gt;
&lt;td&gt;그중 일부&lt;/td&gt;
&lt;td&gt;검사로 뽑은 30개&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;표본평균 (Sample Mean)&lt;/td&gt;
&lt;td&gt;표본의 평균값&lt;/td&gt;
&lt;td&gt;뽑은 부품의 평균 무게&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;표본분포 (Sampling Distribution)&lt;/td&gt;
&lt;td&gt;표본평균들을 여러 번 구했을 때의 분포&lt;/td&gt;
&lt;td&gt;같은 작업을 반복했을 때 평균들의 모양&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 한 번의 평균은 불안정할 수 있지만,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;평균들의 평균은 점점 안정적인 정규분포로 모입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 조금 더 수학적으로 보면&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표본의 크기를 n, 모집단의 평균을 &lt;span&gt;&lt;span&gt;&amp;mu;&lt;/span&gt;&lt;/span&gt;, 표준편차를 &lt;span&gt;&lt;span&gt;&amp;sigma;라&lt;/span&gt;&lt;/span&gt;&amp;nbsp;할 때,&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;150&quot; data-origin-height=&quot;73&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bMdE7z/dJMcacg58Pj/KjIfMk0STnasEPIxsqbWBk/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bMdE7z/dJMcacg58Pj/KjIfMk0STnasEPIxsqbWBk/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bMdE7z/dJMcacg58Pj/KjIfMk0STnasEPIxsqbWBk/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbMdE7z%2FdJMcacg58Pj%2FKjIfMk0STnasEPIxsqbWBk%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;150&quot; height=&quot;73&quot; data-origin-width=&quot;150&quot; data-origin-height=&quot;73&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;표본평균의 평균은 모집단 평균과 같다.&lt;/li&gt;
&lt;li&gt;표본평균의 표준편차(=표준오차)는 작아진다.&lt;/li&gt;
&lt;/ul&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;107&quot; data-origin-height=&quot;65&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/ewdhSo/dJMcaeeUNUq/R2Hz0s7PvgWlZiQNAKteek/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/ewdhSo/dJMcaeeUNUq/R2Hz0s7PvgWlZiQNAKteek/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/ewdhSo/dJMcaeeUNUq/R2Hz0s7PvgWlZiQNAKteek/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FewdhSo%2FdJMcaeeUNUq%2FR2Hz0s7PvgWlZiQNAKteek%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;107&quot; height=&quot;65&quot; data-origin-width=&quot;107&quot; data-origin-height=&quot;65&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;표본이 커질수록 평균이 안정된다.&lt;br /&gt;(100개를 뽑는 게 10개를 뽑는 것보다 훨씬 신뢰할 수 있는 이유죠.)&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 정규분포가 되는 마법&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모집단이 꼭 정규분포일 필요는 없어요.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;왜곡된 분포든,&lt;/li&gt;
&lt;li&gt;한쪽으로 치우친 분포든,&lt;/li&gt;
&lt;li&gt;심지어 불연속적인 데이터라도&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표본크기 n이 충분히 커지면&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 표본평균의 분포는 점점 정규분포에 가까워집니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;즉, &quot;복잡한 세상도, 많이 모으면 평범해진다.&quot;&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 실감 나는 예시&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;예시 1. 공정 검사&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;부품의 무게가 균일하지 않아도,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;100개 단위로 묶어 평균을 내면 그 값들은 종 모양을 그립니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 &lt;b&gt;QC(품질관리)&lt;/b&gt;에서는 항상 표본평균을 모니터링하죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;예시 2. 시험 점수&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;개별 문제 점수는 다양하지만,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;30문제의 평균 점수는 대부분 정규분포 형태를 보입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;예시 3. 머신러닝 모델&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모델을 여러 번 학습시켜 얻은 평균 정확도 값이&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;정규분포 근처에 모이는 이유도 같은 원리예요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 표본이 커질수록 변동이 줄어드는 이유&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표본평균의 표준편차(표준오차)는&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;107&quot; data-origin-height=&quot;71&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/ZEXmO/dJMcaiO9AcW/SdtRqXbCX1B2M7XtsrvMK0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/ZEXmO/dJMcaiO9AcW/SdtRqXbCX1B2M7XtsrvMK0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/ZEXmO/dJMcaiO9AcW/SdtRqXbCX1B2M7XtsrvMK0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FZEXmO%2FdJMcaiO9AcW%2FSdtRqXbCX1B2M7XtsrvMK0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;107&quot; height=&quot;71&quot; data-origin-width=&quot;107&quot; data-origin-height=&quot;71&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 식은 통계학에서 가장 중요한 공식을 꼽을 만해요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;표본 크기 n&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;표준오차 크기&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;4배 증가&lt;/td&gt;
&lt;td&gt;절반으로 감소&lt;/td&gt;
&lt;td&gt;큰 표본은 안정적&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;9배 증가&lt;/td&gt;
&lt;td&gt;1/3로 감소&lt;/td&gt;
&lt;td&gt;평균이 훨씬 정확&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, n이 커질수록 불확실성이 줄어드는 거예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;통계는 표본의 수로 신뢰를 쌓는 학문&lt;/b&gt;입니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;8. 현실 속 중심극한정리&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;제조업 -&amp;gt;&lt;/b&gt; 공정별 샘플링 평균이 정규분포를 따르기 때문에, 관리도가 가능.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;금융 -&amp;gt;&lt;/b&gt; 일별 수익률 평균을 분석할 때, CLT를 가정해야 리스크 계산이 가능.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;데이터 분석 -&amp;gt;&lt;/b&gt; 평균 기반 가설검정(t-test 등)의 전제가 CLT입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;CLT가 없다면, t검정도, 신뢰구간도, 회귀분석도 전부 불가능합니다.&lt;br /&gt;통계의 모든 추론은 &quot;평균이 정규분포로 수렴한다&quot;는 가정 위에서 돌아갑니다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;9. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 포인트&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;중심극한정리&lt;/td&gt;
&lt;td&gt;표본평균은 결국 정규분포를 따른다&lt;/td&gt;
&lt;td&gt;통계의 핵심 원리&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;표본평균&lt;/td&gt;
&lt;td&gt;표본의 평균값&lt;/td&gt;
&lt;td&gt;모집단 평균의 근사치&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;표준오차&lt;/td&gt;
&lt;td&gt;평균의 불확실성&lt;/td&gt;
&lt;td&gt;표본이 많을수록 작아짐&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;분포의 수렴&lt;/td&gt;
&lt;td&gt;모집단 분포와 무관&lt;/td&gt;
&lt;td&gt;반복이 많아질수록 정규화&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;통계의 신뢰성&lt;/td&gt;
&lt;td&gt;CLT가 만드는 기반&lt;/td&gt;
&lt;td&gt;모든 검정의 근거&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;&quot;세상은 혼란스럽지만, 평균은 결국 질서를 만든다.&quot;&lt;/span&gt;&lt;/blockquote&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>Ai</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>정규분포</category>
      <category>중심극한정리</category>
      <category>표본평균</category>
      <category>표준오차</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/463</guid>
      <comments>https://allensdatablog.tistory.com/entry/7%EC%A4%91%EC%8B%AC%EA%B7%B9%ED%95%9C%EC%A0%95%EB%A6%AC%EC%99%80-%ED%91%9C%EB%B3%B8%ED%8F%89%EA%B7%A0-%EB%B6%88%ED%99%95%EC%8B%A4%ED%95%9C-%EC%84%B8%EC%83%81-%EC%86%8D%EC%9D%98-%EC%95%88%EC%A0%95%EB%90%9C-%ED%8F%89%EA%B7%A0#entry463comment</comments>
      <pubDate>Tue, 23 Dec 2025 18:39:36 +0900</pubDate>
    </item>
    <item>
      <title>6. 이항분포 - 성공과 실패,</title>
      <link>https://allensdatablog.tistory.com/entry/6-%EC%9D%B4%ED%95%AD%EB%B6%84%ED%8F%AC-%EC%84%B1%EA%B3%B5%EA%B3%BC-%EC%8B%A4%ED%8C%A8</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/DA4Ec/dJMcaiO9hnQ/ro60lvgA2PQ7apG7NdcKf1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/DA4Ec/dJMcaiO9hnQ/ro60lvgA2PQ7apG7NdcKf1/img.png&quot; data-alt=&quot;이항분포&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/DA4Ec/dJMcaiO9hnQ/ro60lvgA2PQ7apG7NdcKf1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FDA4Ec%2FdJMcaiO9hnQ%2Fro60lvgA2PQ7apG7NdcKf1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;503&quot; height=&quot;503&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;이항분포&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 동전 던지기와 품질검사, 같은 이야기&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;동전을 10번 던졌을 때, 앞면이 정확히 6번 나올 확률은 얼마일까요?&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;혹은 하루에 생산된 부품 100개 중 &lt;b&gt;불량이 3개일 확률&lt;/b&gt;은?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 두 상황은 전혀 달라 보이지만, 수학적으로는 완전히 같은 문제예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;둘 다 다음 조건을 만족하죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;1. 결과는 두 가지뿐이다. -&amp;gt; &lt;b&gt;성공 / 실패&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;2. 각 시행은 독립적이다. -&amp;gt; &lt;b&gt;앞면이 나왔다고 다음에 영향 없음&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;3. 성공 확률은 일정하다. -&amp;gt; &lt;b&gt;p가 변하지 않음&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;4. 시행 횟수 n이 정해져 있다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 네 가지 조건이 충족될 때, 우리는 &quot;이항분포를 따른다&quot;라고 말합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 수식은 짧고, 의미는 깊다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이항분포의 확률은 이렇게 생겼어요.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;274&quot; data-origin-height=&quot;63&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/z1K5V/dJMcacVHntB/DIMkB8MirWkr1l5oNLWS3K/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/z1K5V/dJMcacVHntB/DIMkB8MirWkr1l5oNLWS3K/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/z1K5V/dJMcacVHntB/DIMkB8MirWkr1l5oNLWS3K/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fz1K5V%2FdJMcacVHntB%2FDIMkB8MirWkr1l5oNLWS3K%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;274&quot; height=&quot;63&quot; data-origin-width=&quot;274&quot; data-origin-height=&quot;63&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;기호&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;(n)&lt;/td&gt;
&lt;td&gt;시행 횟수&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;(k)&lt;/td&gt;
&lt;td&gt;성공 횟수&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;(p)&lt;/td&gt;
&lt;td&gt;성공 확률&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;({n}{k})&lt;/td&gt;
&lt;td&gt;n번 중 k번 성공할 수 있는 조합의 수&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이걸 직관적으로 해석하면 이래요,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;전체 n번 중 k번 성공하는 모든 경우의 수 x 그 경우가 일어날 확률.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어, 부품 하나가 불량일 확률이 0.02(p=0.02)이고&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;총 100개(n=100)를 검사했을 때,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;정확히 3개가 불량일 확률은 아래처럼 됩니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;294&quot; data-origin-height=&quot;59&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bC4ohe/dJMcaksE61O/CgIL0bGhUxKMSVosxd46qK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bC4ohe/dJMcaksE61O/CgIL0bGhUxKMSVosxd46qK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bC4ohe/dJMcaksE61O/CgIL0bGhUxKMSVosxd46qK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbC4ohe%2FdJMcaksE61O%2FCgIL0bGhUxKMSVosxd46qK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;294&quot; height=&quot;59&quot; data-origin-width=&quot;294&quot; data-origin-height=&quot;59&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;계산은 복잡하지만, 뜻은 간단하죠.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;3개만 불량일 가능성 = &lt;br /&gt;(3개가 딱 불량이 되는 경우의 수) x (그럴 확률).&quot;&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 이항분포의 중심 - 평균과 분산&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이항분포는 아주 아름다운 특징이 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 중심(평균)과 퍼짐(분산)이 깔끔하게 정리돼요.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;305&quot; data-origin-height=&quot;50&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bSmcLs/dJMcafx7BaG/0nXqU0T2fOJr6zF5oHhY6k/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bSmcLs/dJMcafx7BaG/0nXqU0T2fOJr6zF5oHhY6k/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bSmcLs/dJMcafx7BaG/0nXqU0T2fOJr6zF5oHhY6k/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbSmcLs%2FdJMcafx7BaG%2F0nXqU0T2fOJr6zF5oHhY6k%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;305&quot; height=&quot;50&quot; data-origin-width=&quot;305&quot; data-origin-height=&quot;50&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;예시&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;평균&lt;/td&gt;
&lt;td&gt;기대되는 성공 횟수&lt;/td&gt;
&lt;td&gt;100개 중 불량률 2% &amp;rarr; 평균 불량 2개&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;분산&lt;/td&gt;
&lt;td&gt;변동성, 불확실성의 크기&lt;/td&gt;
&lt;td&gt;(100&amp;times;0.02&amp;times;0.98=1.96) &amp;rarr; 표준편차 &amp;asymp; 1.4개&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 100개 검사하면 &lt;b&gt;평균적으로 2개가 불량,&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 실제로는 0개일 수도, 4개일 수도 있다는 거죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 불확실함을 수학으로 그려주는 게 바로 이항분포예요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 모양으로 보는 이항분포&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;확률은 말보단 그림으로 이해하는 게 훨씬 빨라요.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/pgJlG/dJMcacg5Snz/vqUlVPqGkzkPonJlcCinOk/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/pgJlG/dJMcacg5Snz/vqUlVPqGkzkPonJlcCinOk/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/pgJlG/dJMcacg5Snz/vqUlVPqGkzkPonJlcCinOk/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FpgJlG%2FdJMcacg5Snz%2FvqUlVPqGkzkPonJlcCinOk%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;424&quot; height=&quot;424&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt;p=0.5, n=10&lt;/b&gt; -&amp;gt; 대칭 모양 (동전 10번 던지기)&lt;/li&gt;
&lt;li&gt;&lt;b&gt;p &amp;lt;0.5&lt;/b&gt; -&amp;gt; 왼쪽으로 치우침 (불량이 드문 경우)&lt;/li&gt;
&lt;li&gt;&lt;b&gt;p&amp;gt;0.5&lt;/b&gt; -&amp;gt; 오른쪽으로 치우침 ( 성공이 대부분인 경우)&lt;/li&gt;
&lt;/ul&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 현실 속 이항분포&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1. 품질관리&lt;/b&gt; - 부품 100개 중 불량이 2개 이하일 확률&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;2. 마케팅&lt;/b&gt; - 1,000명에게 메일을 보냈을 때 클릭이 50명 이상일 확률&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;3. 의학&lt;/b&gt; - 약 복용자 20명 중 부작용이 3명 이하일 확률&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 계산이 다 이항분포예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;심지어 AI 모델의 &quot;정확도(Accuracy)&quot;도&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;실은 '정답 맞춘 횟수 / 전체시도' -&amp;gt; 이항적 사건이에요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 실무 감각 한 스푼&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;p가 작고 n이 클 때, 계산이 복잡해지면 포아송분포(Poisson)로 근사할 수 있어요.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; (이건 나중에 다뤄보겠습니다.)&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;n이 충분히 크고 p가 0.5 근처일 때, 정규분포로 근사가 가능합니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; 즉, 이항분포는 통계의 중심 고속도로예요.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;표본이 작을 때엔 직접 이항 계산을,&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; 표본이 클 때엔 정규 근사를 쓰는 게 일반적이에요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 핵심 포인트&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;이항분포&lt;/td&gt;
&lt;td&gt;n번 시행 중 k번 성공 확률&lt;/td&gt;
&lt;td&gt;성공/실패 두 가지 결과의 모델&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;조건&lt;/td&gt;
&lt;td&gt;독립, 동일확률, 이진결과, 고정된 n&lt;/td&gt;
&lt;td&gt;&amp;nbsp;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;확률식&lt;/td&gt;
&lt;td&gt;(P(X=k)=\binom{n}{k}p^k(1-p)^{n-k})&lt;/td&gt;
&lt;td&gt;조합 &amp;times; 확률의 곱&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;평균/분산&lt;/td&gt;
&lt;td&gt;(E(X)=np, Var(X)=np(1-p))&lt;/td&gt;
&lt;td&gt;기대성과 변동성&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;근사&lt;/td&gt;
&lt;td&gt;p&amp;asymp;0.5 &amp;rarr; 정규, p작고n큼 &amp;rarr; 포아송&lt;/td&gt;
&lt;td&gt;&amp;nbsp;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;현실 활용&lt;/td&gt;
&lt;td&gt;품질, 클릭률, 실험 성공률&lt;/td&gt;
&lt;td&gt;가장 널리 쓰이는 분포&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;이항분포는 성공과 실패의 지도를 그려주는 지도예요.&lt;br /&gt;한 번의 결과보다, 전체의 패턴을 보는 시선이랍니다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>Ai</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>분산</category>
      <category>성광확률</category>
      <category>이항분포</category>
      <category>품질</category>
      <category>확률분포</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/462</guid>
      <comments>https://allensdatablog.tistory.com/entry/6-%EC%9D%B4%ED%95%AD%EB%B6%84%ED%8F%AC-%EC%84%B1%EA%B3%B5%EA%B3%BC-%EC%8B%A4%ED%8C%A8#entry462comment</comments>
      <pubDate>Fri, 19 Dec 2025 19:46:25 +0900</pubDate>
    </item>
    <item>
      <title>5. 확률변수와 기댓값 - 평균이 아닌, '기대할 수 있는 세상'</title>
      <link>https://allensdatablog.tistory.com/entry/5-%ED%99%95%EB%A5%A0%EB%B3%80%EC%88%98%EC%99%80-%EA%B8%B0%EB%8C%93%EA%B0%92-%ED%8F%89%EA%B7%A0%EC%9D%B4-%EC%95%84%EB%8B%8C-%EA%B8%B0%EB%8C%80%ED%95%A0-%EC%88%98-%EC%9E%88%EB%8A%94-%EC%84%B8%EC%83%81</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/Xr59i/dJMcakzqhe6/tTiEswpqtrQLjZyi24Got0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/Xr59i/dJMcakzqhe6/tTiEswpqtrQLjZyi24Got0/img.png&quot; data-alt=&quot;기대값&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/Xr59i/dJMcakzqhe6/tTiEswpqtrQLjZyi24Got0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FXr59i%2FdJMcakzqhe6%2FtTiEswpqtrQLjZyi24Got0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;508&quot; height=&quot;508&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;기대값&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 확률이 '가능성의 언어'라면,&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;확률변수는 그 언어를 숫자로 번역한 존재입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;확률변수(random variable)는 이름이 조금 헷갈려요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;랜덤한 변수&quot;라기보다,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;확률도 정의된 세상에서 우리가 관심 있는 값을 숫자로 표현한 도구&quot;&lt;br /&gt;라고 보는 게 더 정확합니다.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 동전을 던질 때,&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;앞면 -&amp;gt; 1점&lt;/li&gt;
&lt;li&gt;뒷면 -&amp;gt; 0점&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;으로 두면, 동전 던지기는 &quot;1 또는 0을 내는 확률변수&quot;가 됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 세상의 불확실한 사건을 숫자로 바꾸는 일.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 확률변수의 역할이에요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 확률변수의 두 가지 종류&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;구분&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 설명&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;예시&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;이산형 (Discrete)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;셀 수 있는 값만 가짐&lt;/td&gt;
&lt;td&gt;주사위 눈(1~6), 고장 횟수&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;연속형 (Continuous)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;특정 구간 내의 모든 값 가능&lt;/td&gt;
&lt;td&gt;자동차 엔진 수명(3000~3200시간)&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 구분이 중요한 이유는,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;확률을 셀 떄 방식이 달라지기 때문이에요.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt;이산형&lt;/b&gt; -&amp;gt; 각 경우의 확률을 더함&lt;/li&gt;
&lt;li&gt;&lt;b&gt;연속형&lt;/b&gt; -&amp;gt; 확률밀도함수(PDF)를 면적으로 계산&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 본질은 같습니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;값이 클수록 얼마나 자주 일어나는가&quot;를 표현한다는 점이에요.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 기대값, 그 이름의 오해&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이제 핵심으로 들어가죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;171&quot; data-origin-height=&quot;47&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bIm4m1/dJMcaeFYq3N/EWmJZMYTUcKmFRxWIWtA8k/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bIm4m1/dJMcaeFYq3N/EWmJZMYTUcKmFRxWIWtA8k/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bIm4m1/dJMcaeFYq3N/EWmJZMYTUcKmFRxWIWtA8k/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbIm4m1%2FdJMcaeFYq3N%2FEWmJZMYTUcKmFRxWIWtA8k%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;171&quot; height=&quot;47&quot; data-origin-width=&quot;171&quot; data-origin-height=&quot;47&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;기댓값(Expected Value)은 말 그대로&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;이 확률변수를 수없이 반복했을 때 평균적으로 기대되는 값&quot;이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 여기서 조심해야 할 부분이 있어요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;기댓값은 우리가 실제로 얻는 값이 아닙니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어, 주사위를 던질 때의 기댓값을 계산해 보죠.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;313&quot; data-origin-height=&quot;36&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/CRcHS/dJMcadfZLVc/bMamTQomE8vuLkE4zHk5U0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/CRcHS/dJMcadfZLVc/bMamTQomE8vuLkE4zHk5U0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/CRcHS/dJMcadfZLVc/bMamTQomE8vuLkE4zHk5U0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FCRcHS%2FdJMcadfZLVc%2FbMamTQomE8vuLkE4zHk5U0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;313&quot; height=&quot;36&quot; data-origin-width=&quot;313&quot; data-origin-height=&quot;36&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그런데 주사위를 던져서 3.5가 나온 적 있나요?&lt;br /&gt;없죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;기댓값은&lt;b&gt; &quot;장기적으로 평균이 수렴하는 지점&quot;,&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 현실의 한 번이 아니라 &quot;무한히 반복된 세상&quot;의 중심이에요.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;기댓값 = &quot;이 게임을 계속했을 때 내가 결국 수렴하게 될 수익(혹은 손실)&quot;&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 현실 속 기댓값의 의미&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt;품질관리 :&lt;/b&gt; 불량률이 2%라면, 100개 중 평균 2개는 불량.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;보험 :&lt;/b&gt; 사고 확률이 1%, 보상금 100만 원 -&amp;gt; 기댓값 = 1만 원 -&amp;gt; 보험료 산정의 기초.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;마케팅 :&lt;/b&gt; 클릭률 0.3%, 클릭당 매출 1000원 -&amp;gt; 기대수익 = 3월/노출.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 기댓값은 단순히 '평균'이 아니라&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;결정과 예측의 기준선&lt;/b&gt;이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;확률적 세상에서 '합리적인 판단'을 위한 나침반 같은 존재죠.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 분산과 기댓값의 관계&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;기댓값이 중심이라면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;분산은 그 중심 주위를 도는 &lt;b&gt;흔들림의 크기예요.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;222&quot; data-origin-height=&quot;42&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/dACpLk/dJMcaa4DZNb/8BckdIX4NG9SdL2zc8uGck/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/dACpLk/dJMcaa4DZNb/8BckdIX4NG9SdL2zc8uGck/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/dACpLk/dJMcaa4DZNb/8BckdIX4NG9SdL2zc8uGck/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FdACpLk%2FdJMcaa4DZNb%2F8BckdIX4NG9SdL2zc8uGck%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;222&quot; height=&quot;42&quot; data-origin-width=&quot;222&quot; data-origin-height=&quot;42&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 식은 외워두면 좋아요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 안에 통계의 감각이 다 들어 있거든요.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;253&quot; data-origin-height=&quot;111&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/ckBLGd/dJMcajUOKbr/1rb2PxzvjLhGfc4GAZ4gg0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/ckBLGd/dJMcajUOKbr/1rb2PxzvjLhGfc4GAZ4gg0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/ckBLGd/dJMcajUOKbr/1rb2PxzvjLhGfc4GAZ4gg0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FckBLGd%2FdJMcajUOKbr%2F1rb2PxzvjLhGfc4GAZ4gg0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;253&quot; height=&quot;111&quot; data-origin-width=&quot;253&quot; data-origin-height=&quot;111&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;즉, 분산은 &quot;기대에서 얼마나 벗어나는가&quot;의 평균이에요.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 분산이 작은 데이터는 안정적이고,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;분산이 큰 데이터는 위험(리스크)이 커요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 확률의 감각을 길러주는 작은 실험&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;상상해 봅시다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;동전 한 개를 10번 던졌을 때 앞면이 몇 번 나올까요?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;기댓값은 10 X 0.5 = 5.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 실제로는 3번, 7번, 4번 등 매번 달라요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 차이가 바로 확률의 현실이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;확률이란 건 &quot;기댓값 근천에서 흔들리는 삶&quot;이에요.&lt;br /&gt;통계는 그 흔들림을 받아들이고 설명하는 언어죠.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;포인트&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;확률변수&lt;/td&gt;
&lt;td&gt;사건을 수치로 표현한 도구&lt;/td&gt;
&lt;td&gt;불확실성을 숫자로 만든다&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;이산형 vs 연속형&lt;/td&gt;
&lt;td&gt;셀 수 있는가 여부&lt;/td&gt;
&lt;td&gt;계산 방식은 다르지만 본질은 동일&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;기댓값&lt;/td&gt;
&lt;td&gt;장기적으로 기대되는 평균&lt;/td&gt;
&lt;td&gt;현실의 값이 아니라 확률적 중심&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;분산&lt;/td&gt;
&lt;td&gt;기댓값 주변의 흔들림&lt;/td&gt;
&lt;td&gt;위험과 불확실성의 척도&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;핵심 감각&lt;/td&gt;
&lt;td&gt;확률은 한 번이 아니라 반복의 언어&lt;/td&gt;
&lt;td&gt;통계는 그 반복의 패턴을 읽는 기술&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;&quot;기댓값은 단 한 번의 결과가 아니라,&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;세상을 백 번 본 사람의 시선이에요.&quot;&lt;/span&gt;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>Ai</category>
      <category>기댓값</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>분산</category>
      <category>통계</category>
      <category>확률변수</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/461</guid>
      <comments>https://allensdatablog.tistory.com/entry/5-%ED%99%95%EB%A5%A0%EB%B3%80%EC%88%98%EC%99%80-%EA%B8%B0%EB%8C%93%EA%B0%92-%ED%8F%89%EA%B7%A0%EC%9D%B4-%EC%95%84%EB%8B%8C-%EA%B8%B0%EB%8C%80%ED%95%A0-%EC%88%98-%EC%9E%88%EB%8A%94-%EC%84%B8%EC%83%81#entry461comment</comments>
      <pubDate>Tue, 16 Dec 2025 09:51:30 +0900</pubDate>
    </item>
    <item>
      <title>4. 확률의 직관 - 불확실함을 다루는 우리의 언어</title>
      <link>https://allensdatablog.tistory.com/entry/4-%ED%99%95%EB%A5%A0%EC%9D%98-%EC%A7%81%EA%B4%80-%EB%B6%88%ED%99%95%EC%8B%A4%ED%95%A8%EC%9D%84-%EB%8B%A4%EB%A3%A8%EB%8A%94-%EC%9A%B0%EB%A6%AC%EC%9D%98-%EC%96%B8%EC%96%B4</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bKpuP4/dJMcaiBBobm/KtNh2ubiLQRLqDX2stxhA1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bKpuP4/dJMcaiBBobm/KtNh2ubiLQRLqDX2stxhA1/img.png&quot; data-alt=&quot;확률&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bKpuP4/dJMcaiBBobm/KtNh2ubiLQRLqDX2stxhA1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbKpuP4%2FdJMcaiBBobm%2FKtNh2ubiLQRLqDX2stxhA1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;601&quot; height=&quot;1024&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;확률&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 확률은 '예측'이 아니라 '태도'입니다.&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;출근길에 하늘이 잔뜩 하려 있고 비가 올 확률이 70%라고 합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이때 우리는 종종 이렇게 생각하죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;70%면 비 오겠네.&quot;&lt;br /&gt;&quot;30%면 안 올 수도 있잖아?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그런데 확률이란 건 &lt;b&gt;&quot;오늘&quot;의 날씨를 말하는 게 아니에요.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;이런 조건의 날씨가 100번 있었다면, 그중 70번은 비가 왔다&quot;는 의미죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 확률은 &lt;b&gt;'단 한 번의 사건'이 아니라 '반복되는 세상'을 보는 언어예요.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이걸 감으로 잡으면,&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;확률이 높다/낮다&quot;는 말이 단순한 수치가 아니라&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;얼마나 일관된 패턴인가&quot;를 말한다는 걸 알게 됩니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 확률은 결국 '가능성의 크기'를 재는 도구&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;확률의 정의는 간단합니다.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;263&quot; data-origin-height=&quot;60&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/wtGnR/dJMcaezcyCi/kX05R0z1Aop7NIwueWccN1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/wtGnR/dJMcaezcyCi/kX05R0z1Aop7NIwueWccN1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/wtGnR/dJMcaezcyCi/kX05R0z1Aop7NIwueWccN1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FwtGnR%2FdJMcaezcyCi%2FkX05R0z1Aop7NIwueWccN1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;263&quot; height=&quot;60&quot; data-origin-width=&quot;263&quot; data-origin-height=&quot;60&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 동전을 던졌을 때&amp;nbsp;앞면이 나올 확률은 1/2.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 여기서 중요한 건 수식보다 &lt;b&gt;사고방식이에요.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;확률은 이렇게 세 단계를 밟아요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;1. 가능한 모든 결과를 상상한다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;2. 그중 내가 관심 있는 사건(A)을 정한다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;3. 그 사건이 얼마나 &quot;드물지 않은가&quot;를 비율로 표현한다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉,&lt;b&gt; &quot;예측&quot;&lt;/b&gt;보다 &lt;b&gt;&quot;세상 구조를 이해하는 도구&quot;&lt;/b&gt;라고 생각해요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 확률이 헷갈리는 이유 - '사람의 직관'은 확률을 싫어한다&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;사람의 뇌는 확률 계산에 약해요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;대신 &lt;b&gt;이야기(서사)&lt;/b&gt;에 훨씬 민감합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어,&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;교통사고로 사망할 확률은 0.001%입니다.&quot;&lt;br /&gt;&quot;이 도로에서는 매년 몇 명이 사고로 목숨을 잃어요.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;두 문장은 같은 정보지만,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;두 번째 문장이 훨씬 실제적으로 느껴지죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;또 이런 착각도 자주 생겨요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;동전을 5번 던졌는데 계속 앞면이 나왔어. 다음엔 뒷면이 나오겠지?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;아니요. 여전히 1/2입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;과거의 사건이 미래의 확률을 바꾸지 않는다-&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 독립사건(independent)의 핵심이죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;b&gt;확률 감각 = &quot;과거는 이미 지나갔고, 기대는 항상 현재 기준으로 다시 계산한다.&quot;&lt;/b&gt;&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 조건부 확률 - &quot;주어진 정보가 확률을 바꾼다&quot;&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;조금 더 깊게 들어가 볼게요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;조건부 확률(Conditional Probability)&lt;/b&gt;은 말 그대로&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;어떤 조건이 주어졌을 때, 그 안에서 다시 계산하는 확률&quot;이에요.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;174&quot; data-origin-height=&quot;62&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/njU89/dJMcafdN5E9/10PJuKFhmdgOz8lo1K30LK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/njU89/dJMcafdN5E9/10PJuKFhmdgOz8lo1K30LK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/njU89/dJMcafdN5E9/10PJuKFhmdgOz8lo1K30LK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FnjU89%2FdJMcafdN5E9%2F10PJuKFhmdgOz8lo1K30LK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;174&quot; height=&quot;62&quot; data-origin-width=&quot;174&quot; data-origin-height=&quot;62&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차의 센서 경고등이 켜졌을 때,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;실제로 고장이 발생할 확률을 구한다고 합시다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;전체 고장 확률 P(A) = 2%&lt;/li&gt;
&lt;li&gt;경고등이 켜질 확률&amp;nbsp; P(B) = 10%&lt;/li&gt;
&lt;li&gt;경고등이 켜졌고 실제 교장인 경우 &lt;span aria-hidden=&quot;true&quot;&gt;P(A&amp;cap;B)&lt;/span&gt; = 1%&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그럼&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;184&quot; data-origin-height=&quot;62&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/cNMQDE/dJMcagRjU3a/XYirxkj3rLCxovWDCZicik/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/cNMQDE/dJMcagRjU3a/XYirxkj3rLCxovWDCZicik/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/cNMQDE/dJMcagRjU3a/XYirxkj3rLCxovWDCZicik/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FcNMQDE%2FdJMcagRjU3a%2FXYirxkj3rLCxovWDCZicik%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;184&quot; height=&quot;62&quot; data-origin-width=&quot;184&quot; data-origin-height=&quot;62&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 경고등이 켜졌을 때 고장일 가능성은 10%입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;단순히 2%보다 높죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 바로 조건부 확률이 주는 힘이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&quot;새로운 정보가 들어오면 확률은 다시 업데이트된다.&quot;&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 원리가 바로&lt;b&gt; 베이즈 정리(Bayes' theorem)&lt;/b&gt;의 근간이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;(이건 다음 글에서 풀어보겠습니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 확률과 일상 - 우리가 이미 쓰고 있는 언어&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;비 오는 확률 70% -&amp;gt; &lt;b&gt;기상 데이터의 누적 패턴&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;불량률 1.5% -&amp;gt; &lt;b&gt;공정의 일관성&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;이 버튼을 눌렀을 때 작동할 확률 98%&quot; -&amp;gt; &lt;b&gt;신뢰성(reliability)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;이 광고 클릭 확률 0.3%&quot; -&amp;gt; &lt;b&gt;예측 모델의 성능&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;확률은 사실 &lt;b&gt;모든 의사결정의 바탕&lt;/b&gt;이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;다만 수학처럼 보이기 때문에 어렵게 느껴질 뿐이죠.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 실무 감각 한 스푼&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1. '확률이 낮다'는 말은 '불가능하다'는 뜻이 아니다.&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;0.1%의 사건도 천 번 중 한 번은 일어나요.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;2. 확률은 항상 '조건'과 함께 봐야 한다.&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&quot;고장이 날 확률 2%&quot; -&amp;gt; &quot;온도 35&amp;deg;C 이상일 때 2%인가?&quot;를 확인&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;3. 확률은 항상 '평균'과 다르다.&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;확률은 발생 가능성, 평균은 결과의 중심. 혼동하지 말 것.&lt;/li&gt;
&lt;/ul&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 한 장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;핵심 포인트&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;확률&lt;/td&gt;
&lt;td&gt;사건이 일어날 가능성의 비율&lt;/td&gt;
&lt;td&gt;&amp;ldquo;한 번이 아니라, 반복의 세상&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;독립사건&lt;/td&gt;
&lt;td&gt;서로 영향을 주지 않는 사건&lt;/td&gt;
&lt;td&gt;동전의 앞뒤는 기억력이 없다&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;조건부 확률&lt;/td&gt;
&lt;td&gt;어떤 조건 아래의 확률&lt;/td&gt;
&lt;td&gt;새로운 정보로 업데이트&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;사람의 직관 vs 확률&lt;/td&gt;
&lt;td&gt;감정은 사건을 과대평가&lt;/td&gt;
&lt;td&gt;숫자는 담담하다&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;실무에서의 확률&lt;/td&gt;
&lt;td&gt;불량률, 클릭률, 예측모델 정확도&lt;/td&gt;
&lt;td&gt;세상을 수치로 이해하는 언어&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>Ai</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>베이즈감각</category>
      <category>조건부확률</category>
      <category>통계입문</category>
      <category>확률</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/460</guid>
      <comments>https://allensdatablog.tistory.com/entry/4-%ED%99%95%EB%A5%A0%EC%9D%98-%EC%A7%81%EA%B4%80-%EB%B6%88%ED%99%95%EC%8B%A4%ED%95%A8%EC%9D%84-%EB%8B%A4%EB%A3%A8%EB%8A%94-%EC%9A%B0%EB%A6%AC%EC%9D%98-%EC%96%B8%EC%96%B4#entry460comment</comments>
      <pubDate>Sat, 13 Dec 2025 09:51:44 +0900</pubDate>
    </item>
    <item>
      <title>3. 요약통계의 진짜 의미 : 평균, 분산, 사분위</title>
      <link>https://allensdatablog.tistory.com/entry/%EC%9A%94%EC%95%BD%ED%86%B5%EA%B3%84%EC%9D%98-%EC%A7%84%EC%A7%9C-%EC%9D%98%EB%AF%B8-%ED%8F%89%EA%B7%A0-%EB%B6%84%EC%82%B0-%EC%82%AC%EB%B6%84%EC%9C%84</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bEsgV0/dJMcac9dAT3/kNLjT3wF3fdTFApRY6z1R1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bEsgV0/dJMcac9dAT3/kNLjT3wF3fdTFApRY6z1R1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bEsgV0/dJMcac9dAT3/kNLjT3wF3fdTFApRY6z1R1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbEsgV0%2FdJMcac9dAT3%2FkNLjT3wF3fdTFApRY6z1R1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;537&quot; height=&quot;537&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. &quot;평균 100점&quot;의 함정&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;한 반 한색들의 시험 평균이 100점이라고 해봅시다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 말을 듣고 &quot;다들 완벽했네!&quot; 라고 생각했다면, 아직 통계의 감각이 덜 잡힌 거예요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;왜냐하면, 아래 두 상황은 모두 평균 100점이거든요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;학생 A&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;학생 B&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 학생 C&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 학생 D&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 학생 E&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;평균&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;100&lt;/td&gt;
&lt;td&gt;100&lt;/td&gt;
&lt;td&gt;100&lt;/td&gt;
&lt;td&gt;100&lt;/td&gt;
&lt;td&gt;100&lt;/td&gt;
&lt;td&gt;100&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;0&lt;/td&gt;
&lt;td&gt;0&lt;/td&gt;
&lt;td&gt;100&lt;/td&gt;
&lt;td&gt;200&lt;/td&gt;
&lt;td&gt;200&lt;/td&gt;
&lt;td&gt;100&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;평균은 같지만, &lt;b&gt;상황은 완전히 다르죠.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;첫 번째 반은 모두 일정한 수준이지만,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;두 번째 반은 '극단'이 섞여 있습니다.(물론 시험 점수는 보통 100점 만점이지만요,)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 바로 &lt;b&gt;평균이 모든 걸 말해주지 못하는 이유예요.&lt;/b&gt;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 분산과 표준편차 : 평균이 말하지 못한 이야기&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;분산(Variance)은 데이터가 평균을 기준으로 얼마나 퍼져 있는가를 나타내요.&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;211&quot; data-origin-height=&quot;64&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/b0sFbL/dJMcaiuPvyR/0M0XHulaWxwTfHJ6EzKLN1/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/b0sFbL/dJMcaiuPvyR/0M0XHulaWxwTfHJ6EzKLN1/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/b0sFbL/dJMcaiuPvyR/0M0XHulaWxwTfHJ6EzKLN1/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fb0sFbL%2FdJMcaiuPvyR%2F0M0XHulaWxwTfHJ6EzKLN1%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;211&quot; height=&quot;64&quot; data-origin-width=&quot;211&quot; data-origin-height=&quot;64&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;말은 복잡하지만, 단순해요.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;평균에서 멀리 떨어진 값이 많을수록 분산이 커진다.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표준편차(Stanradr Deviation)는 분산의 제곱근이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;단위가 원래 데이터와 같아져서 비교하기 쉬워요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;데이터&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;평균&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;표준편차&amp;nbsp; &amp;nbsp; &amp;nbsp;해석&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;[100,100,100,100,100]&lt;/td&gt;
&lt;td&gt;100&lt;/td&gt;
&lt;td&gt;0&lt;/td&gt;
&lt;td&gt;완벽히 균일&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;[0,0,100,200,200]&lt;/td&gt;
&lt;td&gt;100&lt;/td&gt;
&lt;td&gt;89&lt;/td&gt;
&lt;td&gt;극단적으로 퍼져 있음&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;표준편차가 크다는 건 &quot;평균 근처에 데이터가 적다&quot;는 뜻이에요.&lt;br /&gt;즉, 데이터의 일관성(consistency)을 보는 지표라고 생각하면 됩니다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 분포를 보는 눈 : 사분위와 이상치&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;분산은 좋지만, 극단적인 값에 너무 민감해요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 통계에서는 &lt;b&gt;사분위수(Quartile)&lt;/b&gt;라는 개념을 함께 봅니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;데이터를 크기 순으로 나누었을 때,&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;Q1: 하위 25%&lt;/li&gt;
&lt;li&gt;Q2: 중간값(50%)&lt;/li&gt;
&lt;li&gt;Q3: 상위75%&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그리고 사분위 범위(IQR) = Q3-Q1&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 범위를 벗어난 값은 이상치(outlier)로 볼 수 있죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이건 단순히 '버릴 값'을 의미하진 않아요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;오히려 &lt;b&gt;평균이 놓친 흥미로운 데이터&lt;/b&gt;일 수도 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차 엔진 수명 데이터를 보면,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;대부분은 3,000 ~ 3,200시간에서 고장나지만&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;어떤 건 5,000시간 넘게 버텨요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 한두 개가 이상치처럼 보이지만, 사실은 &quot;특별히 내구성이 좋은 케이스&quot;일 수도 있죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 통계적 감각이란 건, 단순히 값을 버리거나 남기는 게 아니라 &quot;왜 이런 값이 생겼을까?&quot;를 묻는 태도예요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 평균, 중앙값, 최빈값 - 세 얼굴의 중심&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;데이터의 중심은 꼭 평균만 있는게 아닙니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;지표&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 설명&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 특징&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;평균 (Mean)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;모든 값을 더해 나눈 값&lt;/td&gt;
&lt;td&gt;극단값에 민감&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;중앙값 (Median)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;정렬했을 때 가운데 값&lt;/td&gt;
&lt;td&gt;극단값의 영향을 거의 안 받음&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;최빈값 (Mode)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;가장 자주 나타나는 값&lt;/td&gt;
&lt;td&gt;범주형 데이터에 유용&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 &lt;b&gt;월급 데이터&lt;/b&gt;를 생각해볼께요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;극소수의 고액 연봉자가 있으면 평균이 확 올라가요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 대부분 사람들의 현실에 가까운 건 중앙값이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 뉴스 기사에서 &quot;평균 연봉 5,000만원&quot;이란 말보다&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&quot;중앙값 3,500만원&quot;이 훨씬 더 현실을 잘 말해줍니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;평균은 &quot;수학적인 중심&quot;이고,&lt;br /&gt;중앙값은 &quot;그 값들의 실제적인 중심&quot; 이에요.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;5. 실무에선?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1. 리포트엔 평균 + 표준편차를 함께 묶어서,&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&quot;평균 80점, 표준편차 5점&quot; 이렇게 써야 &quot;데이터가 얼마나 퍼져 있나&quot; 감이 와요.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;2. 극단값이 있다면, 중앙값으로&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&quot;평균 1,000시간, 중앙값 850시간&quot; -&amp;gt; 한눈에 데이터가 오른쪽으로 긴 분포임을 암시.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;3. 분포 시각화 습관&lt;/b&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;히스토그램, 박스플롯으로 분포를 보는 게 숫자보다 훨씬 빠릅니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;6. 한 장 요약&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 역할&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;해석&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;평균&lt;/td&gt;
&lt;td&gt;중심의 수학적 표현&lt;/td&gt;
&lt;td&gt;대표값이지만 극단값에 취약&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;분산/표준편차&lt;/td&gt;
&lt;td&gt;퍼짐의 정도&lt;/td&gt;
&lt;td&gt;데이터 일관성 측정&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;사분위수/IQR&lt;/td&gt;
&lt;td&gt;분포 요약&lt;/td&gt;
&lt;td&gt;이상치 탐지 및 분포 비대칭성 확인&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;중앙값&lt;/td&gt;
&lt;td&gt;실제 중심&lt;/td&gt;
&lt;td&gt;극단값에 강함&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;요약통계의 본질&lt;/td&gt;
&lt;td&gt;&amp;ldquo;숫자의 이야기&amp;rdquo;&lt;/td&gt;
&lt;td&gt;단순한 계산이 아니라 해석의 출발점&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;b&gt;통계는 계산보다 '읽는 기술'이에요.&lt;/b&gt;&lt;br /&gt;&lt;b&gt;숫자 뒤의 맥락을 읽을 줄 알면, 이미 절반은 배운 겁니다.&lt;/b&gt;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>Eda</category>
      <category>기초통계학</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>데이터요약</category>
      <category>요약통계</category>
      <category>평균과분산</category>
      <category>표준편차</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/459</guid>
      <comments>https://allensdatablog.tistory.com/entry/%EC%9A%94%EC%95%BD%ED%86%B5%EA%B3%84%EC%9D%98-%EC%A7%84%EC%A7%9C-%EC%9D%98%EB%AF%B8-%ED%8F%89%EA%B7%A0-%EB%B6%84%EC%82%B0-%EC%82%AC%EB%B6%84%EC%9C%84#entry459comment</comments>
      <pubDate>Tue, 9 Dec 2025 09:37:24 +0900</pubDate>
    </item>
    <item>
      <title>머신러닝 모델을 평가할 때 Accuracy보다 먼저 봐야 할 것들</title>
      <link>https://allensdatablog.tistory.com/entry/%EB%A8%B8%EC%8B%A0%EB%9F%AC%EB%8B%9D-%EB%AA%A8%EB%8D%B8%EC%9D%84-%ED%8F%89%EA%B0%80%ED%95%A0-%EB%95%8C-Accuracy%EB%B3%B4%EB%8B%A4-%EB%A8%BC%EC%A0%80-%EB%B4%90%EC%95%BC-%ED%95%A0-%EA%B2%83%EB%93%A4</link>
      <description>&lt;p data-end=&quot;151&quot; data-start=&quot;42&quot; data-ke-size=&quot;size16&quot;&gt;모델을 처음 만들어보면, 대부분 Accuracy(정확도)에 집착합니다.&lt;br /&gt;&amp;ldquo;와, 정확도 95%야!&amp;rdquo; &amp;mdash; 숫자는 멋있죠.&lt;br /&gt;하지만 실제로는 이 95%가 &lt;b&gt;아무 의미 없을 수도&lt;/b&gt; 있습니다.&lt;/p&gt;
&lt;p data-end=&quot;243&quot; data-start=&quot;153&quot; data-ke-size=&quot;size16&quot;&gt;Accuracy는 유용하지만, &lt;b&gt;진실을 가려버리는 지표&lt;/b&gt;가 될 때가 많아요.&lt;br /&gt;특히 불균형 데이터(imbalanced data)에서는 더더욱 그렇습니다.&lt;/p&gt;
&lt;hr data-end=&quot;248&quot; data-start=&quot;245&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;271&quot; data-start=&quot;250&quot; data-ke-size=&quot;size26&quot;&gt;1️⃣ Accuracy의 함정&lt;/h2&gt;
&lt;p data-end=&quot;303&quot; data-start=&quot;272&quot; data-ke-size=&quot;size16&quot;&gt;Accuracy는 &amp;ldquo;전체 중 정답을 맞힌 비율&amp;rdquo;이죠.&lt;/p&gt;
&lt;p data-end=&quot;324&quot; data-start=&quot;305&quot; data-ke-size=&quot;size16&quot;&gt;예를 들어, 암 진단 데이터에서&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;388&quot; data-start=&quot;325&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;356&quot; data-start=&quot;325&quot;&gt;환자 1,000명 중 실제 암 환자는 10명뿐이고&lt;/li&gt;
&lt;li data-end=&quot;388&quot; data-start=&quot;357&quot;&gt;모델이 모두 &lt;b&gt;&amp;lsquo;암 아님&amp;rsquo;&lt;/b&gt;이라고 예측했다면?&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;465&quot; data-start=&quot;390&quot; data-ke-size=&quot;size16&quot;&gt;정확도는 무려 &lt;b&gt;99%&lt;/b&gt;입니다.&lt;br /&gt;하지만 정작 &lt;b&gt;진짜 암 환자 10명을 전부 놓쳤죠.&lt;/b&gt;&lt;br /&gt;이런 모델을 믿을 수 있을까요?&lt;/p&gt;
&lt;p data-end=&quot;542&quot; data-start=&quot;467&quot; data-ke-size=&quot;size16&quot;&gt;Accuracy는 전체 비율만 보기 때문에,&lt;br /&gt;&lt;b&gt;소수 클래스(중요하지만 드문 경우)&lt;/b&gt;를 완전히 무시해도 점수가 높게 나옵니다.&lt;/p&gt;
&lt;hr data-end=&quot;547&quot; data-start=&quot;544&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;577&quot; data-start=&quot;549&quot; data-ke-size=&quot;size26&quot;&gt;2️⃣ 먼저 봐야 할 건 &amp;ldquo;불균형&amp;rdquo;의 존재&lt;/h2&gt;
&lt;p data-end=&quot;618&quot; data-start=&quot;578&quot; data-ke-size=&quot;size16&quot;&gt;모델을 평가하기 전, 제일 먼저 확인해야 할 건 데이터의 분포입니다.&lt;/p&gt;
&lt;pre id=&quot;code_1761646265702&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;df['label'].value_counts(normalize=True)&lt;/code&gt;&lt;/pre&gt;
&lt;p data-end=&quot;737&quot; data-start=&quot;675&quot; data-ke-size=&quot;size16&quot;&gt;이렇게 클래스 비율을 보면,&lt;br /&gt;&amp;ldquo;내 데이터는 이미 9:1로 기울어져 있네?&amp;rdquo;&lt;br /&gt;를 금방 알 수 있습니다.&lt;/p&gt;
&lt;p data-end=&quot;780&quot; data-start=&quot;739&quot; data-ke-size=&quot;size16&quot;&gt;이 한 줄이 Accuracy를 신뢰할 수 있는지 판단하는 출발점이에요.&lt;/p&gt;
&lt;hr data-end=&quot;785&quot; data-start=&quot;782&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;829&quot; data-start=&quot;787&quot; data-ke-size=&quot;size26&quot;&gt;3️⃣ Precision과 Recall &amp;mdash; &amp;lsquo;무엇을 놓치고 있는가&amp;rsquo;&lt;/h2&gt;
&lt;p data-end=&quot;896&quot; data-start=&quot;830&quot; data-ke-size=&quot;size16&quot;&gt;Accuracy가 평균적인 성능이라면,&lt;br /&gt;Precision과 Recall은 &amp;ldquo;어디서 틀리고 있는가&amp;rdquo;를 보여줍니다.&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;지표의미비유
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;1058&quot; data-start=&quot;898&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;1058&quot; data-start=&quot;938&quot;&gt;
&lt;tr data-end=&quot;1001&quot; data-start=&quot;938&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;950&quot; data-start=&quot;938&quot;&gt;Precision&lt;/td&gt;
&lt;td data-end=&quot;974&quot; data-start=&quot;950&quot; data-col-size=&quot;sm&quot;&gt;맞췄다고 한 것 중에 실제로 맞은 비율&lt;/td&gt;
&lt;td data-end=&quot;1001&quot; data-start=&quot;974&quot; data-col-size=&quot;sm&quot;&gt;&amp;ldquo;잡은 고기 중 진짜 생선이 얼마나 되나&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1058&quot; data-start=&quot;1002&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1011&quot; data-start=&quot;1002&quot;&gt;Recall&lt;/td&gt;
&lt;td data-end=&quot;1035&quot; data-start=&quot;1011&quot; data-col-size=&quot;sm&quot;&gt;실제로 맞아야 할 것 중 얼마나 맞췄나&lt;/td&gt;
&lt;td data-end=&quot;1058&quot; data-start=&quot;1035&quot; data-col-size=&quot;sm&quot;&gt;&amp;ldquo;전체 생선 중 몇 마리를 잡았나&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;1161&quot; data-start=&quot;1060&quot; data-ke-size=&quot;size16&quot;&gt;의료, 보안, 이상탐지처럼 &lt;b&gt;놓치면 안 되는 경우&lt;/b&gt;는 Recall이 중요하고,&lt;br /&gt;스팸 필터, 광고 추천처럼 &lt;b&gt;잘못 탐지하면 곤란한 경우&lt;/b&gt;는 Precision이 중요하죠.&lt;/p&gt;
&lt;hr data-end=&quot;1166&quot; data-start=&quot;1163&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1197&quot; data-start=&quot;1168&quot; data-ke-size=&quot;size26&quot;&gt;4️⃣ F1-score &amp;mdash; 균형을 보는 시선&lt;/h2&gt;
&lt;p data-end=&quot;1256&quot; data-start=&quot;1198&quot; data-ke-size=&quot;size16&quot;&gt;Precision과 Recall이 서로 엇갈릴 때,&lt;br /&gt;그 둘의 조화를 본 게 F1-score입니다.&lt;/p&gt;
&lt;pre id=&quot;code_1761646275662&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;from sklearn.metrics import f1_score
f1_score(y_true, y_pred)&lt;/code&gt;&lt;/pre&gt;
&lt;p data-end=&quot;1368&quot; data-start=&quot;1334&quot; data-ke-size=&quot;size16&quot;&gt;높을수록 &amp;ldquo;놓치지도, 과하지도 않은&amp;rdquo; 모델이라는 뜻이에요.&lt;/p&gt;
&lt;hr data-end=&quot;1373&quot; data-start=&quot;1370&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1410&quot; data-start=&quot;1375&quot; data-ke-size=&quot;size26&quot;&gt;5️⃣ Confusion Matrix로 오답 패턴 보기&lt;/h2&gt;
&lt;p data-end=&quot;1443&quot; data-start=&quot;1411&quot; data-ke-size=&quot;size16&quot;&gt;숫자 하나보다 훨씬 많은 걸 알려주는 도표가 있습니다.&lt;/p&gt;
&lt;pre id=&quot;code_1761646284474&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;from sklearn.metrics import confusion_matrix
print(confusion_matrix(y_true, y_pred))&lt;/code&gt;&lt;/pre&gt;
&lt;p data-end=&quot;1656&quot; data-start=&quot;1545&quot; data-ke-size=&quot;size16&quot;&gt;이걸 시각화하면, 어떤 클래스에서 과하게 틀리는지 바로 보이죠.&lt;br /&gt;Accuracy가 높더라도 &lt;b&gt;오답이 특정 클래스에 몰려 있다면&lt;/b&gt;,&lt;br /&gt;그건 &amp;ldquo;잘 맞는 모델&amp;rdquo;이 아니라 &amp;ldquo;편향된 모델&amp;rdquo;입니다.&lt;/p&gt;
&lt;hr data-end=&quot;1661&quot; data-start=&quot;1658&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1690&quot; data-start=&quot;1663&quot; data-ke-size=&quot;size26&quot;&gt;6️⃣ ROC와 AUC &amp;mdash; 예측의 민감도&lt;/h2&gt;
&lt;p data-end=&quot;1772&quot; data-start=&quot;1691&quot; data-ke-size=&quot;size16&quot;&gt;분류 임계값(threshold)을 바꿔가며 모델의 반응을 본 게 ROC곡선이고,&lt;br /&gt;그 아래 면적(AUC)이 1에 가까울수록 좋은 모델입니다.&lt;/p&gt;
&lt;p data-end=&quot;1869&quot; data-start=&quot;1774&quot; data-ke-size=&quot;size16&quot;&gt;이건 &amp;ldquo;모델이 얼마나 일관되게 구분을 잘 하는가&amp;rdquo;를 보여줍니다.&lt;br /&gt;Accuracy가 하나의 고정된 점이라면, AUC는 그 모델의 전체적인 성향을 보여주는 곡선이에요.&lt;/p&gt;
&lt;hr data-end=&quot;1874&quot; data-start=&quot;1871&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1907&quot; data-start=&quot;1876&quot; data-ke-size=&quot;size26&quot;&gt;7️⃣ 결국 중요한 건 &amp;ldquo;무엇을 위해 평가하나&amp;rdquo;&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;2031&quot; data-start=&quot;1908&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1946&quot; data-start=&quot;1908&quot;&gt;불량품 탐지 모델이라면, &lt;b&gt;Recall&lt;/b&gt;이 더 중요하겠죠.&lt;/li&gt;
&lt;li data-end=&quot;1985&quot; data-start=&quot;1947&quot;&gt;추천 시스템이라면, &lt;b&gt;Precision&lt;/b&gt;을 높여야 합니다.&lt;/li&gt;
&lt;li data-end=&quot;2031&quot; data-start=&quot;1986&quot;&gt;고객 이탈 예측이라면, &lt;b&gt;F1-score&lt;/b&gt;로 균형을 보는 게 좋습니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;2088&quot; data-start=&quot;2033&quot; data-ke-size=&quot;size16&quot;&gt;즉, 좋은 지표란 &amp;ldquo;문제의 목적&amp;rdquo;과 맞는 지표예요.&lt;br /&gt;Accuracy는 그중 하나일 뿐입니다.&lt;/p&gt;
&lt;hr data-end=&quot;2093&quot; data-start=&quot;2090&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;2107&quot; data-start=&quot;2095&quot; data-ke-size=&quot;size26&quot;&gt;8️⃣ 마무리&lt;/h2&gt;
&lt;p data-end=&quot;2159&quot; data-start=&quot;2108&quot; data-ke-size=&quot;size16&quot;&gt;Accuracy는 익숙하고 계산도 쉽지만,&lt;br /&gt;&lt;b&gt;문제의 맥락을 설명하지는 않습니다.&lt;/b&gt;&lt;/p&gt;
&lt;p data-end=&quot;2262&quot; data-start=&quot;2161&quot; data-ke-size=&quot;size16&quot;&gt;좋은 분석가는 숫자 하나에 만족하지 않고,&lt;br /&gt;그 숫자 뒤에 &amp;ldquo;무엇을 놓치고 있는가&amp;rdquo;를 먼저 봅니다.&lt;br /&gt;모델을 만든다는 건 결국, &lt;b&gt;데이터의 불균형을 이해하는 일&lt;/b&gt;이니까요.&lt;/p&gt;</description>
      <category>Machine Learning/머신러닝</category>
      <category>accuracy</category>
      <category>F1-score</category>
      <category>Precision</category>
      <category>recall</category>
      <category>데이터불균형</category>
      <category>머신러닝</category>
      <category>모델링</category>
      <category>모델평가</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/458</guid>
      <comments>https://allensdatablog.tistory.com/entry/%EB%A8%B8%EC%8B%A0%EB%9F%AC%EB%8B%9D-%EB%AA%A8%EB%8D%B8%EC%9D%84-%ED%8F%89%EA%B0%80%ED%95%A0-%EB%95%8C-Accuracy%EB%B3%B4%EB%8B%A4-%EB%A8%BC%EC%A0%80-%EB%B4%90%EC%95%BC-%ED%95%A0-%EA%B2%83%EB%93%A4#entry458comment</comments>
      <pubDate>Sat, 6 Dec 2025 20:13:40 +0900</pubDate>
    </item>
    <item>
      <title>통계에서 p-value를 &amp;lsquo;감으로&amp;rsquo; 이해하는 법</title>
      <link>https://allensdatablog.tistory.com/entry/%ED%86%B5%EA%B3%84%EC%97%90%EC%84%9C-p-value%EB%A5%BC-%E2%80%98%EA%B0%90%EC%9C%BC%EB%A1%9C%E2%80%99-%EC%9D%B4%ED%95%B4%ED%95%98%EB%8A%94-%EB%B2%95</link>
      <description>&lt;p data-end=&quot;172&quot; data-start=&quot;32&quot; data-ke-size=&quot;size16&quot;&gt;p-value는 통계를 처음 배우는 사람들이 가장 자주 헷갈리는 개념 중 하나예요.&lt;br /&gt;수식으로 배우면 외워지긴 하는데, 정작 &lt;b&gt;언제 작고 언제 큰 게 중요한지&lt;/b&gt; 잘 안 와닿죠.&lt;br /&gt;그래서 이번엔 공식을 잠깐 내려두고, &amp;ldquo;감&amp;rdquo;으로 이해해볼게요.&lt;/p&gt;
&lt;hr data-end=&quot;177&quot; data-start=&quot;174&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;217&quot; data-start=&quot;179&quot; data-ke-size=&quot;size26&quot;&gt;1️⃣ p-value는 &amp;lsquo;우연일 확률&amp;rsquo;이다 (단, 조건부로)&lt;/h2&gt;
&lt;p data-end=&quot;241&quot; data-start=&quot;218&quot; data-ke-size=&quot;size16&quot;&gt;p-value는 이렇게 묻는 값이에요.&lt;/p&gt;
&lt;blockquote data-end=&quot;300&quot; data-start=&quot;242&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;300&quot; data-start=&quot;244&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;내가 관찰한 결과가, &lt;b&gt;진짜로 아무 일도 일어나지 않았다고 가정했을 때&lt;/b&gt; 얼마나 희귀한가?&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;407&quot; data-start=&quot;302&quot; data-ke-size=&quot;size16&quot;&gt;예를 들어 동전을 던졌는데 연속으로 8번 앞면이 나왔다면,&lt;br /&gt;&amp;ldquo;이게 우연일 확률&amp;rdquo;을 계산한 게 p-value죠.&lt;br /&gt;만약 그 확률이 0.003이라면, 우리는 이렇게 말할 수 있습니다.&lt;/p&gt;
&lt;blockquote data-end=&quot;435&quot; data-start=&quot;408&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;435&quot; data-start=&quot;410&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;이건 우연이라고 보기엔 너무 희귀하네.&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;547&quot; data-start=&quot;437&quot; data-ke-size=&quot;size16&quot;&gt;즉, &lt;b&gt;p-value가 작을수록 &amp;lsquo;우연이 아닐 가능성&amp;rsquo;이 커 보인다&lt;/b&gt;는 뜻이에요.&lt;br /&gt;(정확히는, 귀무가설 하에서 이런 데이터가 나올 확률이 작다는 거지만 감으로는 이게 훨씬 직관적입니다.)&lt;/p&gt;
&lt;hr data-end=&quot;552&quot; data-start=&quot;549&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;591&quot; data-start=&quot;554&quot; data-ke-size=&quot;size26&quot;&gt;2️⃣ p-value는 &amp;lsquo;데이터가 나를 놀라게 하는 정도&amp;rsquo;&lt;/h2&gt;
&lt;p data-end=&quot;620&quot; data-start=&quot;592&quot; data-ke-size=&quot;size16&quot;&gt;통계적 유의성은 사실 놀람의 크기와 비슷합니다.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;682&quot; data-start=&quot;621&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;650&quot; data-start=&quot;621&quot;&gt;p-value가 크면 &amp;rarr; &amp;ldquo;그럴 수도 있지.&amp;rdquo;&lt;/li&gt;
&lt;li data-end=&quot;682&quot; data-start=&quot;651&quot;&gt;p-value가 작으면 &amp;rarr; &amp;ldquo;이건 좀 이상한데?&amp;rdquo;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;783&quot; data-start=&quot;684&quot; data-ke-size=&quot;size16&quot;&gt;예를 들어, 새로 만든 비료가 작물 성장률을 5% 높였다면&lt;br /&gt;그게 자연스러운 변동인지, 아니면 정말 비료 덕분인지 궁금하죠.&lt;br /&gt;p-value는 바로 그 경계를 정해줍니다.&lt;/p&gt;
&lt;blockquote data-end=&quot;850&quot; data-start=&quot;785&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;850&quot; data-start=&quot;787&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;이 정도 차이는 그냥 우연일 수도 있겠는데(p=0.2)&amp;rdquo;&lt;br /&gt;&amp;ldquo;이건 우연이라 보기 어렵다(p=0.01)&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;883&quot; data-start=&quot;852&quot; data-ke-size=&quot;size16&quot;&gt;이걸 숫자로 말해주는 게 p-value의 역할이에요.&lt;/p&gt;
&lt;hr data-end=&quot;888&quot; data-start=&quot;885&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;918&quot; data-start=&quot;890&quot; data-ke-size=&quot;size26&quot;&gt;3️⃣ 0.05는 &amp;lsquo;마법의 숫자&amp;rsquo;가 아니다&lt;/h2&gt;
&lt;p data-end=&quot;1032&quot; data-start=&quot;919&quot; data-ke-size=&quot;size16&quot;&gt;많은 교재에서 &amp;ldquo;p &amp;lt; 0.05면 유의하다&amp;rdquo;고 배우지만,&lt;br /&gt;그건 절대적인 기준이 아니라 &lt;b&gt;약속 같은 관습&lt;/b&gt;이에요.&lt;br /&gt;상황에 따라 더 엄격하게(0.01) 보거나, 느슨하게(0.1) 봐도 됩니다.&lt;/p&gt;
&lt;p data-end=&quot;1042&quot; data-start=&quot;1034&quot; data-ke-size=&quot;size16&quot;&gt;중요한 건,&lt;/p&gt;
&lt;blockquote data-end=&quot;1121&quot; data-start=&quot;1043&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;1121&quot; data-start=&quot;1045&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;이 p-value가 지금 상황에서 어떤 &amp;lsquo;결정&amp;rsquo;을 정당화하나?&amp;rdquo;&lt;br /&gt;이지,&lt;br /&gt;&amp;ldquo;이 숫자가 0.05 밑인가?&amp;rdquo;&lt;br /&gt;가 아니에요.&lt;/p&gt;
&lt;/blockquote&gt;
&lt;hr data-end=&quot;1126&quot; data-start=&quot;1123&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1162&quot; data-start=&quot;1128&quot; data-ke-size=&quot;size26&quot;&gt;4️⃣ p-value가 작다고 진실이 되는 건 아니다&lt;/h2&gt;
&lt;p data-end=&quot;1232&quot; data-start=&quot;1163&quot; data-ke-size=&quot;size16&quot;&gt;p-value는 단지 &lt;b&gt;데이터와 가설이 얼마나 어색한지&lt;/b&gt;를 말해줄 뿐,&lt;br /&gt;가설이 참인지 거짓인지를 말하진 않습니다.&lt;/p&gt;
&lt;p data-end=&quot;1330&quot; data-start=&quot;1234&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;p&amp;lt;0.05니까 내 주장은 맞다!&amp;rdquo;는 말은&lt;br /&gt;&amp;ldquo;비가 오니까 내가 세차를 해서 그렇다&amp;rdquo; 수준의 비약이에요.&lt;br /&gt;우연이 아닐 가능성은 높지만, 인과는 아직 모르는 거죠.&lt;/p&gt;
&lt;hr data-end=&quot;1335&quot; data-start=&quot;1332&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1367&quot; data-start=&quot;1337&quot; data-ke-size=&quot;size26&quot;&gt;5️⃣ p-value를 바라보는 더 좋은 관점&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1439&quot; data-start=&quot;1368&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1391&quot; data-start=&quot;1368&quot;&gt;&lt;b&gt;귀무가설 하에서의 놀람 정도&lt;/b&gt;&lt;/li&gt;
&lt;li data-end=&quot;1424&quot; data-start=&quot;1392&quot;&gt;&lt;b&gt;데이터가 가설과 얼마나 안 어울리는가의 척도&lt;/b&gt;&lt;/li&gt;
&lt;li data-end=&quot;1439&quot; data-start=&quot;1425&quot;&gt;&lt;b&gt;의심의 강도&lt;/b&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;1545&quot; data-start=&quot;1441&quot; data-ke-size=&quot;size16&quot;&gt;이렇게 생각하면 외우지 않아도 감이 잡힙니다.&lt;br /&gt;p-value는 &amp;lsquo;판단 기준&amp;rsquo;이 아니라 &amp;lsquo;판단의 온도계&amp;rsquo;예요.&lt;br /&gt;데이터를 보고 얼마나 놀랐는지, 그 감각을 숫자로 표현한 것뿐이죠.&lt;/p&gt;
&lt;hr data-end=&quot;1550&quot; data-start=&quot;1547&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1568&quot; data-start=&quot;1552&quot; data-ke-size=&quot;size26&quot;&gt;6️⃣ 예시로 마무리&lt;/h2&gt;
&lt;div&gt;
&lt;div&gt;&lt;b&gt;상황&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; p-value 해석&lt;/b&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;1748&quot; data-start=&quot;1569&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;1748&quot; data-start=&quot;1618&quot;&gt;
&lt;tr data-end=&quot;1668&quot; data-start=&quot;1618&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1649&quot; data-start=&quot;1618&quot;&gt;새로운 약이 기존 약보다 효과 2배, p=0.001&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1668&quot; data-start=&quot;1649&quot;&gt;&amp;ldquo;이건 거의 확실히 다르다&amp;rdquo;&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot;&gt;&amp;nbsp;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1710&quot; data-start=&quot;1669&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1692&quot; data-start=&quot;1669&quot;&gt;실험 결과 약간의 차이, p=0.07&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1710&quot; data-start=&quot;1692&quot;&gt;&amp;ldquo;미묘하네, 더 봐야겠다&amp;rdquo;&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot;&gt;&amp;nbsp;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1748&quot; data-start=&quot;1711&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1729&quot; data-start=&quot;1711&quot;&gt;차이 거의 없음, p=0.8&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1748&quot; data-start=&quot;1729&quot;&gt;&amp;ldquo;그냥 비슷하다고 봐야겠다&amp;rdquo;&lt;/td&gt;
&lt;td data-col-size=&quot;sm&quot;&gt;&amp;nbsp;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;1833&quot; data-start=&quot;1750&quot; data-ke-size=&quot;size16&quot;&gt;결국 p-value는 &lt;b&gt;&amp;lsquo;판단의 강도&amp;rsquo;를 숫자로 표현한 신호&lt;/b&gt;예요.&lt;br /&gt;숫자 자체보다 &amp;ldquo;이게 나를 얼마나 설득시키는가&amp;rdquo;를 보는 게 핵심입니다.&lt;/p&gt;
&lt;hr data-end=&quot;1838&quot; data-start=&quot;1835&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1852&quot; data-start=&quot;1840&quot; data-ke-size=&quot;size26&quot;&gt;7️⃣ 마무리&lt;/h2&gt;
&lt;p data-end=&quot;1963&quot; data-start=&quot;1853&quot; data-ke-size=&quot;size16&quot;&gt;p-value를 이해한다는 건 수학이 아니라 태도에 관한 일입니다.&lt;br /&gt;데이터를 보고, &amp;ldquo;이게 얼마나 우연스럽지 않은가?&amp;rdquo;를 묻는 감각.&lt;br /&gt;그게 생기면 통계는 훨씬 사람 냄새 나게 다가옵니다.&lt;/p&gt;</description>
      <category>Data Analysis/통계&amp;amp;분석</category>
      <category>pvalue</category>
      <category>가설검정</category>
      <category>데이터사고</category>
      <category>데이터해석</category>
      <category>유의확률</category>
      <category>통계</category>
      <category>통계적사고</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/457</guid>
      <comments>https://allensdatablog.tistory.com/entry/%ED%86%B5%EA%B3%84%EC%97%90%EC%84%9C-p-value%EB%A5%BC-%E2%80%98%EA%B0%90%EC%9C%BC%EB%A1%9C%E2%80%99-%EC%9D%B4%ED%95%B4%ED%95%98%EB%8A%94-%EB%B2%95#entry457comment</comments>
      <pubDate>Wed, 3 Dec 2025 20:09:52 +0900</pubDate>
    </item>
    <item>
      <title>EDA(탐색적 데이터 분석)는 &amp;lsquo;문제 정의&amp;rsquo;의 연장선이다</title>
      <link>https://allensdatablog.tistory.com/entry/EDA%ED%83%90%EC%83%89%EC%A0%81-%EB%8D%B0%EC%9D%B4%ED%84%B0-%EB%B6%84%EC%84%9D%EB%8A%94-%E2%80%98%EB%AC%B8%EC%A0%9C-%EC%A0%95%EC%9D%98%E2%80%99%EC%9D%98-%EC%97%B0%EC%9E%A5%EC%84%A0%EC%9D%B4%EB%8B%A4</link>
      <description>&lt;p data-end=&quot;133&quot; data-start=&quot;37&quot; data-ke-size=&quot;size16&quot;&gt;데이터 분석을 시작하면 대부분 이렇게 말하죠.&lt;br /&gt;&amp;ldquo;먼저 EDA를 합니다.&amp;rdquo;&lt;br /&gt;하지만 많은 초보 분석가들이 EDA를 &lt;b&gt;&amp;lsquo;데이터를 구경하는 과정&amp;rsquo;&lt;/b&gt;쯤으로 생각합니다.&lt;/p&gt;
&lt;p data-end=&quot;246&quot; data-start=&quot;135&quot; data-ke-size=&quot;size16&quot;&gt;사실 EDA는 그보다 훨씬 중요한 일입니다.&lt;br /&gt;탐색은 끝이 아니라 &lt;b&gt;&amp;lsquo;문제 정의의 연장선&amp;rsquo;&lt;/b&gt;이에요.&lt;br /&gt;데이터를 들여다보며, 내가 세운 가설이 현실에 맞는지 계속 검증하고 조정하는 과정이죠.&lt;/p&gt;
&lt;hr data-end=&quot;251&quot; data-start=&quot;248&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;287&quot; data-start=&quot;253&quot; data-ke-size=&quot;size26&quot;&gt;1️⃣ 문제 정의는 &amp;ldquo;생각&amp;rdquo;이고, EDA는 &amp;ldquo;증거&amp;rdquo;다&lt;/h2&gt;
&lt;p data-end=&quot;307&quot; data-start=&quot;288&quot; data-ke-size=&quot;size16&quot;&gt;문제 정의는 이렇게 시작합니다.&lt;/p&gt;
&lt;blockquote data-end=&quot;363&quot; data-start=&quot;308&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;363&quot; data-start=&quot;310&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;판매가 떨어지는 이유가 시즌 요인일까?&amp;rdquo;&lt;br /&gt;&amp;ldquo;고객 이탈이 늘어난 건 가격 때문일까?&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;471&quot; data-start=&quot;365&quot; data-ke-size=&quot;size16&quot;&gt;하지만 이건 가설일 뿐이에요.&lt;br /&gt;EDA는 그 가설이 &lt;b&gt;데이터와 실제로 맞닿아 있는지&lt;/b&gt; 확인합니다.&lt;br /&gt;즉, &amp;lsquo;문제를 세운다 &amp;rarr; 데이터를 본다 &amp;rarr; 다시 문제를 다듬는다&amp;rsquo;의 순환 구조.&lt;/p&gt;
&lt;p data-end=&quot;580&quot; data-start=&quot;473&quot; data-ke-size=&quot;size16&quot;&gt;그래서 잘하는 분석가는 &lt;b&gt;EDA 단계에서 문제 정의를 재작성&lt;/b&gt;합니다.&lt;br /&gt;&amp;ldquo;생각보다 시즌보다는 지역별 차이가 크네?&amp;rdquo;&lt;br /&gt;이 한 줄의 통찰이 다음 단계 모델링보다 훨씬 큰 영향을 주죠.&lt;/p&gt;
&lt;hr data-end=&quot;585&quot; data-start=&quot;582&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;619&quot; data-start=&quot;587&quot; data-ke-size=&quot;size26&quot;&gt;2️⃣ EDA는 &amp;lsquo;관찰&amp;rsquo;이 아니라 &amp;lsquo;질문&amp;rsquo;의 과정&lt;/h2&gt;
&lt;p data-end=&quot;702&quot; data-start=&quot;620&quot; data-ke-size=&quot;size16&quot;&gt;단순히 분포를 그려보고, 결측치를 세는 건 반쪽짜리 탐색입니다.&lt;br /&gt;EDA의 진짜 목적은 데이터를 통해 &lt;b&gt;질문을 정교하게 바꾸는 것&lt;/b&gt;이에요.&lt;/p&gt;
&lt;p data-end=&quot;723&quot; data-start=&quot;704&quot; data-ke-size=&quot;size16&quot;&gt;예를 들어 매출 데이터를 보면서&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;793&quot; data-start=&quot;724&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;756&quot; data-start=&quot;724&quot;&gt;&amp;ldquo;이상치가 있네&amp;rdquo; &amp;rarr; &amp;ldquo;왜 특정 달에만 튀었을까?&amp;rdquo;&lt;/li&gt;
&lt;li data-end=&quot;793&quot; data-start=&quot;757&quot;&gt;&amp;ldquo;남성보다 여성 매출이 높네&amp;rdquo; &amp;rarr; &amp;ldquo;연령대별로는 어떤가?&amp;rdquo;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;870&quot; data-start=&quot;795&quot; data-ke-size=&quot;size16&quot;&gt;이렇게 질문이 깊어지면, 이미 절반은 분석이 끝난 겁니다.&lt;br /&gt;좋은 EDA는 항상 &amp;ldquo;그래서 다음엔 뭘 확인해야 하지?&amp;rdquo;를 남깁니다.&lt;/p&gt;
&lt;hr data-end=&quot;875&quot; data-start=&quot;872&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;907&quot; data-start=&quot;877&quot; data-ke-size=&quot;size26&quot;&gt;3️⃣ 시각화는 &amp;lsquo;확인&amp;rsquo;이 아니라 &amp;lsquo;사고도구&amp;rsquo;&lt;/h2&gt;
&lt;p data-end=&quot;982&quot; data-start=&quot;908&quot; data-ke-size=&quot;size16&quot;&gt;많은 사람들이 그래프를 &amp;ldquo;결과 보여주기용&amp;rdquo;으로만 씁니다.&lt;br /&gt;하지만 탐색 단계의 시각화는 &lt;b&gt;머릿속 모델을 검증하는 도구&lt;/b&gt;예요.&lt;/p&gt;
&lt;p data-end=&quot;1116&quot; data-start=&quot;984&quot; data-ke-size=&quot;size16&quot;&gt;히스토그램을 그릴 때는 분포를 보는 게 아니라,&lt;br /&gt;&amp;ldquo;내가 상상한 패턴이 실제로 존재하나?&amp;rdquo;를 확인하는 거죠.&lt;br /&gt;그래프 하나를 그리고 &amp;ldquo;어? 이건 예상 밖인데?&amp;rdquo; 하는 순간,&lt;br /&gt;EDA는 단순 기술 통계에서 진짜 탐색으로 바뀝니다.&lt;/p&gt;
&lt;hr data-end=&quot;1121&quot; data-start=&quot;1118&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1142&quot; data-start=&quot;1123&quot; data-ke-size=&quot;size26&quot;&gt;4️⃣ 좋은 EDA의 특징&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1273&quot; data-start=&quot;1143&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1179&quot; data-start=&quot;1143&quot;&gt;데이터의 형태를 설명하지 않고, &lt;b&gt;현상을 이야기&lt;/b&gt;한다.&lt;/li&gt;
&lt;li data-end=&quot;1210&quot; data-start=&quot;1180&quot;&gt;단순 통계보다, &lt;b&gt;패턴과 맥락&lt;/b&gt;을 발견한다.&lt;/li&gt;
&lt;li data-end=&quot;1241&quot; data-start=&quot;1211&quot;&gt;결론을 서두르지 않고, &lt;b&gt;질문을 확장&lt;/b&gt;한다.&lt;/li&gt;
&lt;li data-end=&quot;1273&quot; data-start=&quot;1242&quot;&gt;시각화 결과를 &lt;b&gt;&amp;ldquo;왜?&amp;rdquo;라는 말로 해석&lt;/b&gt;한다.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;1322&quot; data-start=&quot;1275&quot; data-ke-size=&quot;size16&quot;&gt;EDA는 답을 내는 게 아니라,&lt;br /&gt;&amp;ldquo;어디에 답이 있을지&amp;rdquo;를 좁혀가는 과정입니다.&lt;/p&gt;
&lt;hr data-end=&quot;1327&quot; data-start=&quot;1324&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1341&quot; data-start=&quot;1329&quot; data-ke-size=&quot;size26&quot;&gt;5️⃣ 마무리&lt;/h2&gt;
&lt;p data-end=&quot;1448&quot; data-start=&quot;1342&quot; data-ke-size=&quot;size16&quot;&gt;EDA는 분석의 첫 단계가 아니라,&lt;br /&gt;&lt;b&gt;&amp;lsquo;문제를 다시 정의하는 두 번째 기회&amp;rsquo;&lt;/b&gt;예요.&lt;br /&gt;처음 세운 가설이 틀렸다는 걸 빨리 깨닫는 게&lt;br /&gt;분석가에게는 가장 값진 순간이기도 합니다.&lt;/p&gt;
&lt;p data-end=&quot;1513&quot; data-start=&quot;1450&quot; data-ke-size=&quot;size16&quot;&gt;데이터를 보는 시선이 바뀌면, 문제의 형태도 달라집니다.&lt;br /&gt;그리고 바로 거기서, 진짜 인사이트가 태어납니다.&lt;/p&gt;</description>
      <category>Data Analysis/통계&amp;amp;분석</category>
      <category>'데이터사고</category>
      <category>Eda</category>
      <category>가설검증</category>
      <category>데이터분석</category>
      <category>문제정의</category>
      <category>인사이트</category>
      <category>탐색적데이터분석</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/456</guid>
      <comments>https://allensdatablog.tistory.com/entry/EDA%ED%83%90%EC%83%89%EC%A0%81-%EB%8D%B0%EC%9D%B4%ED%84%B0-%EB%B6%84%EC%84%9D%EB%8A%94-%E2%80%98%EB%AC%B8%EC%A0%9C-%EC%A0%95%EC%9D%98%E2%80%99%EC%9D%98-%EC%97%B0%EC%9E%A5%EC%84%A0%EC%9D%B4%EB%8B%A4#entry456comment</comments>
      <pubDate>Sun, 30 Nov 2025 20:04:16 +0900</pubDate>
    </item>
    <item>
      <title>Pandas groupby를 이해한다는 건 결국 &amp;lsquo;집계의 사고방식&amp;rsquo;을 익히는 일</title>
      <link>https://allensdatablog.tistory.com/entry/Pandas-groupby%EB%A5%BC-%EC%9D%B4%ED%95%B4%ED%95%9C%EB%8B%A4%EB%8A%94-%EA%B1%B4-%EA%B2%B0%EA%B5%AD-%E2%80%98%EC%A7%91%EA%B3%84%EC%9D%98-%EC%82%AC%EA%B3%A0%EB%B0%A9%EC%8B%9D%E2%80%99%EC%9D%84-%EC%9D%B5%ED%9E%88%EB%8A%94-%EC%9D%BC</link>
      <description>&lt;p data-end=&quot;193&quot; data-start=&quot;50&quot; data-ke-size=&quot;size16&quot;&gt;처음 Pandas를 배울 때 가장 헷갈리는 부분이 groupby()죠.&lt;br /&gt;&amp;ldquo;도대체 이게 뭐 하는 함수지?&amp;rdquo;라는 생각이 들다가,&lt;br /&gt;한순간 &amp;lsquo;아, &lt;b&gt;집계의 흐름&lt;/b&gt;을 바꾸는 도구구나&amp;rsquo; 하고 감이 옵니다.&lt;br /&gt;오늘은 그 감을 잡는 이야기를 해볼게요.&lt;/p&gt;
&lt;hr data-end=&quot;198&quot; data-start=&quot;195&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;232&quot; data-start=&quot;200&quot; data-ke-size=&quot;size26&quot;&gt;1️⃣ groupby는 &amp;ldquo;요약을 위한 사고 전환&amp;rdquo;&lt;/h2&gt;
&lt;p data-end=&quot;325&quot; data-start=&quot;233&quot; data-ke-size=&quot;size16&quot;&gt;엑셀 피벗처럼 Pandas의 groupby도 데이터를 묶고 요약합니다.&lt;br /&gt;하지만 단순히 &amp;ldquo;그룹화&amp;rdquo;가 아니라,&lt;b&gt; &amp;lsquo;요약 단위로 사고를 전환&amp;rsquo;&lt;/b&gt;하는 거예요.&lt;/p&gt;
&lt;p data-end=&quot;352&quot; data-start=&quot;327&quot; data-ke-size=&quot;size16&quot;&gt;예를 들어 이런 데이터가 있다고 해봅시다.&lt;/p&gt;
&lt;pre id=&quot;code_1761645346615&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;import pandas as pd

df = pd.DataFrame({
    'team': ['A', 'A', 'B', 'B', 'B', 'C'],
    'score': [10, 12, 20, 18, 15, 8]
})&lt;/code&gt;&lt;/pre&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;팀별 평균 점수&amp;rdquo;를 구하고 싶다면 이렇게 쓰죠:&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;df.groupby('team')['score'].mean() &lt;/blockquote&gt;
&lt;p data-end=&quot;681&quot; data-start=&quot;570&quot; data-ke-size=&quot;size16&quot;&gt;여기서 중요한 건 groupby가 &lt;b&gt;데이터를 재정렬한 게 아니라, 사고의 단위를 팀별로 바꿨다&lt;/b&gt;는 겁니다.&lt;br /&gt;이제부터 Pandas는 &amp;ldquo;전체 행&amp;rdquo;이 아니라 &amp;ldquo;각 팀&amp;rdquo;을 기준으로 생각합니다.&lt;/p&gt;
&lt;hr data-end=&quot;686&quot; data-start=&quot;683&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;717&quot; data-start=&quot;688&quot; data-ke-size=&quot;size26&quot;&gt;2️⃣ 집계는 &amp;lsquo;묶고 나서 요약하기&amp;rsquo;의 조합&lt;/h2&gt;
&lt;p data-end=&quot;745&quot; data-start=&quot;718&quot; data-ke-size=&quot;size16&quot;&gt;groupby()는 두 단계로 작동합니다.&lt;/p&gt;
&lt;ol style=&quot;list-style-type: decimal;&quot; data-end=&quot;824&quot; data-start=&quot;747&quot; data-ke-list-type=&quot;decimal&quot;&gt;
&lt;li data-end=&quot;779&quot; data-start=&quot;747&quot;&gt;&lt;b&gt;split&lt;/b&gt; &amp;ndash; 기준 컬럼으로 데이터를 나눔&lt;/li&gt;
&lt;li data-end=&quot;824&quot; data-start=&quot;780&quot;&gt;&lt;b&gt;apply/combine&lt;/b&gt; &amp;ndash; 나눠진 각 덩어리에 집계 함수 적용&lt;/li&gt;
&lt;/ol&gt;
&lt;p data-end=&quot;830&quot; data-start=&quot;826&quot; data-ke-size=&quot;size16&quot;&gt;즉,&lt;/p&gt;
&lt;blockquote data-end=&quot;830&quot; data-start=&quot;826&quot; data-ke-style=&quot;style2&quot;&gt;groupby &amp;rarr; 집계(aggregate)&lt;/blockquote&gt;
&lt;p data-end=&quot;886&quot; data-start=&quot;869&quot; data-ke-size=&quot;size16&quot;&gt;는 사실상 이런 개념이에요.&lt;/p&gt;
&lt;blockquote data-end=&quot;927&quot; data-start=&quot;888&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;927&quot; data-start=&quot;890&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;데이터를 묶은 뒤, 그룹별로 &amp;lsquo;의미 있는 대표값&amp;rsquo;을 만든다.&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;971&quot; data-start=&quot;929&quot; data-ke-size=&quot;size16&quot;&gt;이 사고를 익히면 평균이든, 합계든, 최대&amp;middot;최소든 자연스럽게 이해됩니다.&lt;/p&gt;
&lt;hr data-end=&quot;976&quot; data-start=&quot;973&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1002&quot; data-start=&quot;978&quot; data-ke-size=&quot;size26&quot;&gt;3️⃣ 하나 이상의 기준으로도 가능&lt;/h2&gt;
&lt;div&gt;
&lt;div&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;df.groupby(['team', 'region'])['sales'].sum()&lt;/blockquote&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;1184&quot; data-start=&quot;1065&quot; data-ke-size=&quot;size16&quot;&gt;이건 &amp;ldquo;팀별 + 지역별 합계&amp;rdquo;죠.&lt;br /&gt;결과는 다층 인덱스로 나오는데,&lt;br /&gt;이는 &amp;ldquo;요약의 축이 두 개&amp;rdquo;라는 뜻이에요.&lt;br /&gt;즉, groupby는 단순 계산이 아니라, &lt;b&gt;요약 테이블을 만드는 사고의 도구&lt;/b&gt;입니다.&lt;/p&gt;
&lt;hr data-end=&quot;1189&quot; data-start=&quot;1186&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1212&quot; data-start=&quot;1191&quot; data-ke-size=&quot;size26&quot;&gt;4️⃣ 직접 집계함수 지정하기&lt;/h2&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;df.groupby('team').agg({'score':&amp;nbsp;['mean',&amp;nbsp;'max',&amp;nbsp;'min']}) &lt;/blockquote&gt;
&lt;p data-end=&quot;1339&quot; data-start=&quot;1285&quot; data-ke-size=&quot;size16&quot;&gt;한 번에 여러 요약 통계를 낼 수도 있고,&lt;br /&gt;컬럼마다 다른 집계함수를 지정할 수도 있습니다.&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1761645403601&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;df.groupby('team').agg({
    'score': 'mean',
    'age': 'max'
})&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;1482&quot; data-start=&quot;1422&quot; data-ke-size=&quot;size16&quot;&gt;이렇게 보면 groupby는 단순 함수가 아니라&lt;br /&gt;&amp;ldquo;데이터에서 의미를 추출하는 틀&amp;rdquo;로 작동하는 거예요.&lt;/p&gt;
&lt;hr data-end=&quot;1487&quot; data-start=&quot;1484&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1519&quot; data-start=&quot;1489&quot; data-ke-size=&quot;size26&quot;&gt;5️⃣ 시야를 바꾸면 groupby가 쉬워진다&lt;/h2&gt;
&lt;p data-end=&quot;1583&quot; data-start=&quot;1520&quot; data-ke-size=&quot;size16&quot;&gt;많은 사람들이 groupby를 어렵게 느끼는 이유는 &amp;ldquo;코드 형태&amp;rdquo; 때문입니다.&lt;br /&gt;하지만 본질은 이거예요:&lt;/p&gt;
&lt;blockquote data-end=&quot;1626&quot; data-start=&quot;1585&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;1626&quot; data-start=&quot;1587&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;원본 데이터의 개별 행을 잠시 잊고, 그룹 단위로 세상을 본다.&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;1724&quot; data-start=&quot;1628&quot; data-ke-size=&quot;size16&quot;&gt;그룹별 요약값을 생각하고, 그걸 숫자로 표현할 뿐이죠.&lt;br /&gt;SQL의 GROUP BY 문법, 엑셀의 피벗 테이블, R의 summarise() 전부 같은 사고입니다.&lt;/p&gt;
&lt;hr data-end=&quot;1729&quot; data-start=&quot;1726&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1745&quot; data-start=&quot;1731&quot; data-ke-size=&quot;size26&quot;&gt;6️⃣ 정리하자면&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1913&quot; data-start=&quot;1746&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1792&quot; data-start=&quot;1746&quot;&gt;groupby는 데이터를 묶는 게 아니라 &lt;b&gt;요약 단위를 바꾸는 행위&lt;/b&gt;&lt;/li&gt;
&lt;li data-end=&quot;1844&quot; data-start=&quot;1793&quot;&gt;집계는 &amp;ldquo;묶기(split) &amp;rarr; 계산(apply) &amp;rarr; 합치기(combine)&amp;rdquo;의 3단계&lt;/li&gt;
&lt;li data-end=&quot;1880&quot; data-start=&quot;1845&quot;&gt;여러 기준으로 묶거나, 여러 통계를 한 번에 낼 수 있음&lt;/li&gt;
&lt;li data-end=&quot;1913&quot; data-start=&quot;1881&quot;&gt;핵심은 &amp;ldquo;무엇을 기준으로 요약할까?&amp;rdquo;라는 사고 전환&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1918&quot; data-start=&quot;1915&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;p data-end=&quot;2031&quot; data-start=&quot;1920&quot; data-ke-size=&quot;size16&quot;&gt;groupby를 이해한다는 건 결국,&lt;br /&gt;&amp;ldquo;데이터를 어떻게 바라볼 것인가&amp;rdquo;의 문제예요.&lt;br /&gt;숫자보다 &lt;b&gt;구조를 본다&lt;/b&gt;는 감각이 생기면,&lt;br /&gt;그때부터 집계는 더 이상 문법이 아니라 직관이 됩니다.&lt;/p&gt;</description>
      <category>Programming/Python</category>
      <category>groupby</category>
      <category>pandas</category>
      <category>python</category>
      <category>데이터분석</category>
      <category>데이터처리</category>
      <category>집계</category>
      <category>피벗</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/455</guid>
      <comments>https://allensdatablog.tistory.com/entry/Pandas-groupby%EB%A5%BC-%EC%9D%B4%ED%95%B4%ED%95%9C%EB%8B%A4%EB%8A%94-%EA%B1%B4-%EA%B2%B0%EA%B5%AD-%E2%80%98%EC%A7%91%EA%B3%84%EC%9D%98-%EC%82%AC%EA%B3%A0%EB%B0%A9%EC%8B%9D%E2%80%99%EC%9D%84-%EC%9D%B5%ED%9E%88%EB%8A%94-%EC%9D%BC#entry455comment</comments>
      <pubDate>Thu, 27 Nov 2025 20:00:04 +0900</pubDate>
    </item>
    <item>
      <title>SQL에서 NULL은 왜 골칫거리인가?</title>
      <link>https://allensdatablog.tistory.com/entry/SQL%EC%97%90%EC%84%9C-NULL%EC%9D%80-%EC%99%9C-%EA%B3%A8%EC%B9%AB%EA%B1%B0%EB%A6%AC%EC%9D%B8%EA%B0%80</link>
      <description>&lt;p data-end=&quot;178&quot; data-start=&quot;27&quot; data-ke-size=&quot;size16&quot;&gt;데이터베이스를 조금만 써봐도 금방 느낍니다.&lt;br /&gt;&amp;ldquo;NULL은 그냥 빈값이지, 뭐 어때?&amp;rdquo; 했다가 결과가 이상하게 나오는 그 순간.&lt;br /&gt;NULL은 단순한 &amp;lsquo;빈칸&amp;rsquo;이 아니라 &lt;b&gt;&amp;ldquo;모름(unknown)&lt;/b&gt;&amp;rdquo;이에요.&lt;br /&gt;그리고 이 &amp;lsquo;모름&amp;rsquo;이, SQL의 논리를 흔들어놓습니다.&lt;/p&gt;
&lt;hr data-end=&quot;183&quot; data-start=&quot;180&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;218&quot; data-start=&quot;185&quot; data-ke-size=&quot;size26&quot;&gt;1️⃣ NULL은 0도 아니고, 빈 문자열도 아니다&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;302&quot; data-start=&quot;219&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;245&quot; data-start=&quot;219&quot;&gt;0은 &amp;ldquo;값이 있음 (단, 그게 0)&amp;rdquo;&lt;/li&gt;
&lt;li data-end=&quot;270&quot; data-start=&quot;246&quot;&gt;''은 &amp;ldquo;문자열인데 내용이 없음&amp;rdquo;&lt;/li&gt;
&lt;li data-end=&quot;302&quot; data-start=&quot;271&quot;&gt;NULL은 &amp;ldquo;&lt;b&gt;값이 아예 존재하지 않음&lt;/b&gt;&amp;rdquo;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;356&quot; data-start=&quot;304&quot; data-ke-size=&quot;size16&quot;&gt;즉, &amp;ldquo;지금은 모르겠어&amp;rdquo; 상태예요.&lt;br /&gt;이걸 기억하지 않으면 비교나 계산이 전부 꼬입니다.&lt;/p&gt;
&lt;hr data-end=&quot;361&quot; data-start=&quot;358&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;386&quot; data-start=&quot;363&quot; data-ke-size=&quot;size26&quot;&gt;2️⃣ 비교 연산이 통하지 않는다&lt;/h2&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;SELECT&amp;nbsp;*&amp;nbsp;FROM&amp;nbsp;users&amp;nbsp;WHERE&amp;nbsp;age&amp;nbsp;=&amp;nbsp;NULL;&amp;nbsp;&amp;nbsp;&amp;nbsp;--&amp;nbsp;결과&amp;nbsp;없음 &lt;/blockquote&gt;
&lt;p data-end=&quot;534&quot; data-start=&quot;448&quot; data-ke-size=&quot;size16&quot;&gt;= 연산자는 &amp;ldquo;값이 같음&amp;rdquo;을 판단하지만,&lt;br /&gt;NULL은 &amp;ldquo;값이 없다&amp;rdquo;이기 때문에 비교 자체가 성립하지 않습니다.&lt;br /&gt;그래서 결과가 아예 안 나와요.&lt;/p&gt;
&lt;p data-end=&quot;560&quot; data-start=&quot;536&quot; data-ke-size=&quot;size16&quot;&gt;NULL을 찾고 싶다면 이렇게 써야 합니다.&lt;/p&gt;
&lt;blockquote data-end=&quot;560&quot; data-start=&quot;536&quot; data-ke-style=&quot;style3&quot;&gt;WHERE&amp;nbsp;age&amp;nbsp;IS&amp;nbsp;NULL &lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;= NULL&amp;rdquo;이 아니라 &amp;ldquo;IS NULL&amp;rdquo;이에요.&lt;br /&gt;이 미묘한 차이를 처음 알게 되는 순간, 대부분은 살짝 화가 납니다.&lt;/p&gt;
&lt;hr data-end=&quot;665&quot; data-start=&quot;662&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;693&quot; data-start=&quot;667&quot; data-ke-size=&quot;size26&quot;&gt;3️⃣ 수식에서도 조용히 문제를 만든다&lt;/h2&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;SELECT&amp;nbsp;price&amp;nbsp;*&amp;nbsp;quantity&amp;nbsp;AS&amp;nbsp;total&amp;nbsp;FROM&amp;nbsp;orders; &lt;/blockquote&gt;
&lt;p data-end=&quot;831&quot; data-start=&quot;752&quot; data-ke-size=&quot;size16&quot;&gt;만약 price나 quantity 중 하나라도 NULL이라면?&lt;br /&gt;total도 NULL이 됩니다.&lt;br /&gt;계산 불가 &amp;rarr; 결과 없음.&lt;/p&gt;
&lt;p data-end=&quot;884&quot; data-start=&quot;833&quot; data-ke-size=&quot;size16&quot;&gt;그래서 실제 분석 쿼리에서는 COALESCE()나 IFNULL()을 자주 씁니다.&lt;/p&gt;
&lt;blockquote data-end=&quot;884&quot; data-start=&quot;833&quot; data-ke-style=&quot;style3&quot;&gt;SELECT&amp;nbsp;COALESCE(price,&amp;nbsp;0)&amp;nbsp;*&amp;nbsp;COALESCE(quantity,&amp;nbsp;0)&amp;nbsp;AS&amp;nbsp;total&amp;nbsp;FROM&amp;nbsp;orders; &lt;/blockquote&gt;
&lt;blockquote data-end=&quot;1016&quot; data-start=&quot;970&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;1016&quot; data-start=&quot;972&quot; data-ke-size=&quot;size16&quot;&gt;COALESCE(a, b)는 a가 NULL이면 b로 대체해주는 함수예요.&lt;/p&gt;
&lt;/blockquote&gt;
&lt;hr data-end=&quot;1021&quot; data-start=&quot;1018&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1049&quot; data-start=&quot;1023&quot; data-ke-size=&quot;size26&quot;&gt;4️⃣ 논리 연산도 2가 아니라 3이다&lt;/h2&gt;
&lt;p data-end=&quot;1124&quot; data-start=&quot;1051&quot; data-ke-size=&quot;size16&quot;&gt;SQL의 논리에는 TRUE, FALSE 외에 **UNKNOWN**이 있습니다.&lt;br /&gt;NULL이 등장하면 이게 작동하죠.&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;표현식결과
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;1212&quot; data-start=&quot;1126&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;1212&quot; data-start=&quot;1149&quot;&gt;
&lt;tr data-end=&quot;1167&quot; data-start=&quot;1149&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1159&quot; data-start=&quot;1149&quot;&gt;1 = 1&lt;/td&gt;
&lt;td data-end=&quot;1167&quot; data-start=&quot;1159&quot; data-col-size=&quot;sm&quot;&gt;TRUE&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1187&quot; data-start=&quot;1168&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1178&quot; data-start=&quot;1168&quot;&gt;1 = 2&lt;/td&gt;
&lt;td data-end=&quot;1187&quot; data-start=&quot;1178&quot; data-col-size=&quot;sm&quot;&gt;FALSE&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1212&quot; data-start=&quot;1188&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1201&quot; data-start=&quot;1188&quot;&gt;1 = NULL&lt;/td&gt;
&lt;td data-end=&quot;1212&quot; data-start=&quot;1201&quot; data-col-size=&quot;sm&quot;&gt;UNKNOWN&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;1309&quot; data-start=&quot;1214&quot; data-ke-size=&quot;size16&quot;&gt;이 UNKNOWN 때문에 WHERE 필터에 걸리지 않고 빠져나갑니다.&lt;br /&gt;즉, &amp;ldquo;조건을 만족하지 않는 값&amp;rdquo;이 아니라 &amp;ldquo;조건을 평가할 수 없는 값&amp;rdquo;으로 처리돼요.&lt;/p&gt;
&lt;hr data-end=&quot;1314&quot; data-start=&quot;1311&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1340&quot; data-start=&quot;1316&quot; data-ke-size=&quot;size26&quot;&gt;5️⃣ 집계함수에서도 조용히 빠진다&lt;/h2&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;SELECT&amp;nbsp;AVG(salary)&amp;nbsp;FROM&amp;nbsp;employees; &lt;/blockquote&gt;
&lt;p data-end=&quot;1459&quot; data-start=&quot;1388&quot; data-ke-size=&quot;size16&quot;&gt;salary에 NULL이 있으면 그 행은 &lt;b&gt;평균 계산에서 제외&lt;/b&gt;됩니다.&lt;br /&gt;0으로 처리되는 게 아니라 그냥 빠집니다.&lt;/p&gt;
&lt;p data-end=&quot;1515&quot; data-start=&quot;1461&quot; data-ke-size=&quot;size16&quot;&gt;그래서 평균이 실제보다 높게 나올 수도 있죠.&lt;br /&gt;이걸 의식하지 않으면 분석 결과가 왜곡돼요.&lt;/p&gt;
&lt;hr data-end=&quot;1520&quot; data-start=&quot;1517&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1548&quot; data-start=&quot;1522&quot; data-ke-size=&quot;size26&quot;&gt;6️⃣ 그렇다면 NULL은 나쁜 걸까?&lt;/h2&gt;
&lt;p data-end=&quot;1641&quot; data-start=&quot;1550&quot; data-ke-size=&quot;size16&quot;&gt;그렇진 않습니다.&lt;br /&gt;NULL은 &amp;ldquo;아직 모르는 것&amp;rdquo;을 표현하기 위한 필요악 같은 존재예요.&lt;br /&gt;문제는 우리가 &lt;b&gt;모름을 모른 채 계산하려고 할 때&lt;/b&gt; 생깁니다.&lt;/p&gt;
&lt;p data-end=&quot;1670&quot; data-start=&quot;1643&quot; data-ke-size=&quot;size16&quot;&gt;좋은 데이터베이스 설계에서는 다음을 고민하죠.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1765&quot; data-start=&quot;1671&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1705&quot; data-start=&quot;1671&quot;&gt;NULL이 의미 있는 칸인가, 아니면 잘못된 입력인가?&lt;/li&gt;
&lt;li data-end=&quot;1730&quot; data-start=&quot;1706&quot;&gt;NULL을 0으로 대체해도 괜찮은가?&lt;/li&gt;
&lt;li data-end=&quot;1765&quot; data-start=&quot;1731&quot;&gt;쿼리 결과에 NULL이 들어오면 어떻게 처리할 것인가?&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;1803&quot; data-start=&quot;1767&quot; data-ke-size=&quot;size16&quot;&gt;이런 고민이 있어야 통계나 대시보드의 수치가 신뢰를 얻습니다.&lt;/p&gt;
&lt;hr data-end=&quot;1808&quot; data-start=&quot;1805&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1824&quot; data-start=&quot;1810&quot; data-ke-size=&quot;size26&quot;&gt;7️⃣ 정리하자면&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1974&quot; data-start=&quot;1825&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1868&quot; data-start=&quot;1825&quot;&gt;NULL은 &amp;ldquo;모름(unknown)&amp;rdquo;이지, &amp;ldquo;0&amp;rdquo;이나 &amp;ldquo;빈값&amp;rdquo;이 아니다.&lt;/li&gt;
&lt;li data-end=&quot;1929&quot; data-start=&quot;1869&quot;&gt;=, &amp;lt;&amp;gt; 같은 비교는 통하지 않는다. (IS NULL / IS NOT NULL 사용)&lt;/li&gt;
&lt;li data-end=&quot;1955&quot; data-start=&quot;1930&quot;&gt;계산&amp;middot;집계&amp;middot;논리에서 모두 영향을 준다.&lt;/li&gt;
&lt;li data-end=&quot;1974&quot; data-start=&quot;1956&quot;&gt;무시하면 결과가 왜곡된다.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;2056&quot; data-start=&quot;1976&quot; data-ke-size=&quot;size16&quot;&gt;NULL은 귀찮지만, SQL을 이해하는 가장 좋은 교재이기도 합니다.&lt;br /&gt;그 존재를 의식하기 시작하면, 데이터의 질을 보는 눈이 달라집니다.&lt;/p&gt;</description>
      <category>DataBase/SQL</category>
      <category>DB</category>
      <category>null</category>
      <category>SQL</category>
      <category>결측치</category>
      <category>데이터베이스</category>
      <category>데이터분석</category>
      <category>데이터품질</category>
      <category>집계함수</category>
      <category>쿼리</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/454</guid>
      <comments>https://allensdatablog.tistory.com/entry/SQL%EC%97%90%EC%84%9C-NULL%EC%9D%80-%EC%99%9C-%EA%B3%A8%EC%B9%AB%EA%B1%B0%EB%A6%AC%EC%9D%B8%EA%B0%80#entry454comment</comments>
      <pubDate>Mon, 24 Nov 2025 19:53:43 +0900</pubDate>
    </item>
    <item>
      <title>ChatGPT said:SQLite3: 가볍지만 꽤 단단한 데이터베이스</title>
      <link>https://allensdatablog.tistory.com/entry/ChatGPT-saidSQLite3-%EA%B0%80%EB%B3%8D%EC%A7%80%EB%A7%8C-%EA%BD%A4-%EB%8B%A8%EB%8B%A8%ED%95%9C-%EB%8D%B0%EC%9D%B4%ED%84%B0%EB%B2%A0%EC%9D%B4%EC%8A%A4</link>
      <description>&lt;p data-end=&quot;175&quot; data-start=&quot;32&quot; data-ke-size=&quot;size16&quot;&gt;파이썬에서 데이터를 다루다 보면 &amp;ldquo;엑셀 말고, 좀 더 체계적으로 저장할 방법 없을까?&amp;rdquo; 싶을 때가 있죠. 그럴 때 딱 맞는 게 &lt;b&gt;SQLite3&lt;/b&gt;입니다. 설치할 것도, 서버를 켤 것도 필요 없어요. 그저 하나의 .db 파일이 곧 데이터베이스입니다.&lt;/p&gt;
&lt;hr data-end=&quot;180&quot; data-start=&quot;177&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;204&quot; data-start=&quot;182&quot; data-ke-size=&quot;size26&quot;&gt;1️⃣ SQLite3가 뭔데요?&lt;/h2&gt;
&lt;p data-end=&quot;247&quot; data-start=&quot;205&quot; data-ke-size=&quot;size16&quot;&gt;SQLite는 이름 그대로 &amp;ldquo;가벼운(Lite) SQL 데이터베이스&amp;rdquo;예요.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;411&quot; data-start=&quot;248&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;288&quot; data-start=&quot;248&quot;&gt;&lt;b&gt;파일 하나로 동작&lt;/b&gt;: 데이터베이스가 파일 단위로 저장됩니다.&lt;/li&gt;
&lt;li data-end=&quot;345&quot; data-start=&quot;289&quot;&gt;&lt;b&gt;별도 서버 불필요&lt;/b&gt;: MySQL이나 PostgreSQL처럼 서버를 띄울 필요가 없습니다.&lt;/li&gt;
&lt;li data-end=&quot;411&quot; data-start=&quot;346&quot;&gt;&lt;b&gt;표준 SQL 지원&lt;/b&gt;: SELECT, WHERE, JOIN 같은 익숙한 구문 그대로 사용 가능.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;454&quot; data-start=&quot;413&quot; data-ke-size=&quot;size16&quot;&gt;그래서 간단한 분석, 로컬 앱, 혹은 프로토타입 DB로 많이 쓰입니다.&lt;/p&gt;
&lt;hr data-end=&quot;459&quot; data-start=&quot;456&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;479&quot; data-start=&quot;461&quot; data-ke-size=&quot;size26&quot;&gt;2️⃣ 파이썬에서 써보기&lt;/h2&gt;
&lt;p data-end=&quot;533&quot; data-start=&quot;481&quot; data-ke-size=&quot;size16&quot;&gt;SQLite는 파이썬에 이미 내장돼 있어요. import sqlite3만 하면 됩니다.&lt;/p&gt;
&lt;pre id=&quot;code_1761644764616&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;import sqlite3

# DB 연결 (파일이 없으면 자동 생성)
conn = sqlite3.connect(&quot;example.db&quot;)
cur = conn.cursor()

# 테이블 만들기
cur.execute(&quot;&quot;&quot;
CREATE TABLE IF NOT EXISTS users (
    id INTEGER PRIMARY KEY,
    name TEXT,
    age INTEGER
)
&quot;&quot;&quot;)

# 데이터 넣기
cur.execute(&quot;INSERT INTO users (name, age) VALUES (?, ?)&quot;, (&quot;Alice&quot;, 25))
conn.commit()

# 조회
cur.execute(&quot;SELECT * FROM users&quot;)
print(cur.fetchall())

conn.close()&lt;/code&gt;&lt;/pre&gt;
&lt;p data-end=&quot;987&quot; data-start=&quot;950&quot; data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-end=&quot;987&quot; data-start=&quot;950&quot; data-ke-size=&quot;size16&quot;&gt;단 세 줄로 DB 만들고, 바로 데이터를 읽고 쓸 수 있습니다.&lt;/p&gt;
&lt;hr data-end=&quot;992&quot; data-start=&quot;989&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1008&quot; data-start=&quot;994&quot; data-ke-size=&quot;size26&quot;&gt;3️⃣ 장점 요약&lt;/h2&gt;
&lt;div&gt;
&lt;div&gt;&lt;b&gt;항목&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;설명&lt;/b&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;1175&quot; data-start=&quot;1009&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;1175&quot; data-start=&quot;1037&quot;&gt;
&lt;tr data-end=&quot;1068&quot; data-start=&quot;1037&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1050&quot; data-start=&quot;1037&quot;&gt;&lt;b&gt;설치 불필요&lt;/b&gt;&lt;/td&gt;
&lt;td data-end=&quot;1068&quot; data-start=&quot;1050&quot; data-col-size=&quot;sm&quot;&gt;파이썬만 있으면 바로 사용&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1098&quot; data-start=&quot;1069&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1079&quot; data-start=&quot;1069&quot;&gt;&lt;b&gt;가벼움&lt;/b&gt;&lt;/td&gt;
&lt;td data-end=&quot;1098&quot; data-start=&quot;1079&quot; data-col-size=&quot;sm&quot;&gt;단일 .db 파일로 동작&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1142&quot; data-start=&quot;1099&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1112&quot; data-start=&quot;1099&quot;&gt;&lt;b&gt;이식성 높음&lt;/b&gt;&lt;/td&gt;
&lt;td data-end=&quot;1142&quot; data-start=&quot;1112&quot; data-col-size=&quot;sm&quot;&gt;파일 복사만으로 다른 컴퓨터에서 바로 실행 가능&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1175&quot; data-start=&quot;1143&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1156&quot; data-start=&quot;1143&quot;&gt;&lt;b&gt;SQL 표준&lt;/b&gt;&lt;/td&gt;
&lt;td data-end=&quot;1175&quot; data-start=&quot;1156&quot; data-col-size=&quot;sm&quot;&gt;다른 DB로 전환하기도 쉬움&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;1180&quot; data-start=&quot;1177&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1196&quot; data-start=&quot;1182&quot; data-ke-size=&quot;size26&quot;&gt;4️⃣ 주의할 점&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1321&quot; data-start=&quot;1197&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1255&quot; data-start=&quot;1197&quot;&gt;&lt;b&gt;여러 사용자가 동시에 접근&lt;/b&gt;하는 환경에는 부적합합니다. (파일 기반이라 동시 쓰기에 약해요)&lt;/li&gt;
&lt;li data-end=&quot;1321&quot; data-start=&quot;1256&quot;&gt;&lt;b&gt;대규모 트래픽&lt;/b&gt;이 필요한 서비스라면 MySQL, PostgreSQL 같은 서버형 DB를 고려해야 합니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1326&quot; data-start=&quot;1323&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1359&quot; data-start=&quot;1328&quot; data-ke-size=&quot;size26&quot;&gt;5️⃣ 데이터 분석에서 SQLite가 좋은 이유&lt;/h2&gt;
&lt;p data-end=&quot;1489&quot; data-start=&quot;1360&quot; data-ke-size=&quot;size16&quot;&gt;CSV로만 분석하면 매번 read_csv()로 불러와야 하지만, SQLite에 한 번 저장해두면 SELECT 문으로 필요한 부분만 불러올 수 있습니다.&lt;br /&gt;대용량 CSV보다 빠르고, 중복 데이터를 관리하기도 훨씬 편하죠.&lt;/p&gt;
&lt;pre id=&quot;code_1761644892776&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;import pandas as pd
conn = sqlite3.connect(&quot;example.db&quot;)
df = pd.read_sql_query(&quot;SELECT * FROM users WHERE age &amp;gt; 20&quot;, conn)&lt;/code&gt;&lt;/pre&gt;
&lt;p data-end=&quot;1694&quot; data-start=&quot;1630&quot; data-ke-size=&quot;size16&quot;&gt;분석용 데이터 저장소로 SQLite를 써두면, &lt;b&gt;가벼운 SQL + Pandas 조합&lt;/b&gt;이 훌륭하게 맞물립니다.&lt;/p&gt;
&lt;hr data-end=&quot;1699&quot; data-start=&quot;1696&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1713&quot; data-start=&quot;1701&quot; data-ke-size=&quot;size26&quot;&gt;6️⃣ 마무리&lt;/h2&gt;
&lt;p data-end=&quot;1833&quot; data-start=&quot;1714&quot; data-ke-size=&quot;size16&quot;&gt;SQLite는 &amp;ldquo;작은 규모지만 깔끔한 관리가 필요한 데이터&amp;rdquo;에 정말 잘 어울립니다.&lt;br /&gt;데이터가 커지면 언제든 더 큰 DB로 옮길 수도 있고요.&lt;br /&gt;개발자 입장에선 &amp;ldquo;정리 정돈 잘 된 메모장&amp;rdquo; 같은 존재랄까요.&lt;/p&gt;</description>
      <category>DataBase/SQL</category>
      <category>Database</category>
      <category>DB</category>
      <category>python</category>
      <category>SQL</category>
      <category>SQLite3</category>
      <category>데이터관리</category>
      <category>데이터분석</category>
      <category>파이썬</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/453</guid>
      <comments>https://allensdatablog.tistory.com/entry/ChatGPT-saidSQLite3-%EA%B0%80%EB%B3%8D%EC%A7%80%EB%A7%8C-%EA%BD%A4-%EB%8B%A8%EB%8B%A8%ED%95%9C-%EB%8D%B0%EC%9D%B4%ED%84%B0%EB%B2%A0%EC%9D%B4%EC%8A%A4#entry453comment</comments>
      <pubDate>Sat, 22 Nov 2025 19:48:39 +0900</pubDate>
    </item>
    <item>
      <title>미니콘다 vs 아나콘다: 뭐가 내 스타일일까?</title>
      <link>https://allensdatablog.tistory.com/entry/%EB%AF%B8%EB%8B%88%EC%BD%98%EB%8B%A4-vs-%EC%95%84%EB%82%98%EC%BD%98%EB%8B%A4-%EB%AD%90%EA%B0%80-%EB%82%B4-%EC%8A%A4%ED%83%80%EC%9D%BC%EC%9D%BC%EA%B9%8C</link>
      <description>&lt;p data-end=&quot;129&quot; data-start=&quot;29&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;파이썬 깔아야 하는데, 미니콘다? 아나콘다? 뭐부터 눌러요?&amp;rdquo; 실무에서 제일 자주 듣는 질문이죠. 결론부터 말하면, &lt;b&gt;도구를 고른다기보다 &amp;ldquo;설치 철학&amp;rdquo;을 고르는 선택&lt;/b&gt;입니다.&lt;/p&gt;
&lt;h2 data-end=&quot;148&quot; data-start=&quot;131&quot; data-ke-size=&quot;size26&quot;&gt;한 줄 요약 (TL;DR)&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;334&quot; data-start=&quot;149&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;208&quot; data-start=&quot;149&quot;&gt;&lt;b&gt;미니콘다(Miniconda)&lt;/b&gt;: 가벼운 기본기 + 필요한 것만 내가 설치. 깔끔, 빠름, 유연함.&lt;/li&gt;
&lt;li data-end=&quot;278&quot; data-start=&quot;209&quot;&gt;&lt;b&gt;아나콘다(Anaconda)&lt;/b&gt;: 데이터 과학용 왕창 세트. 설치 직후 대부분 준비 완료. 대신 무겁고 느릴 수 있음.&lt;/li&gt;
&lt;li data-end=&quot;334&quot; data-start=&quot;279&quot;&gt;&amp;ldquo;처음 시작&amp;rdquo;이면 아나콘다가 편하고, &amp;ldquo;조금만 익숙&amp;rdquo;하면 미니콘다!&lt;/li&gt;
&lt;/ul&gt;
&lt;h2 data-end=&quot;348&quot; data-start=&quot;336&quot; data-ke-size=&quot;size26&quot;&gt;차이를 표로 정리&lt;/h2&gt;
&lt;div&gt;
&lt;div&gt;&lt;b&gt;항목&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 미니콘다&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 아나콘다&lt;/b&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%; height: 118px;&quot; border=&quot;1&quot; data-end=&quot;647&quot; data-start=&quot;349&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;647&quot; data-start=&quot;384&quot;&gt;
&lt;tr style=&quot;height: 18px;&quot; data-end=&quot;410&quot; data-start=&quot;384&quot;&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;392&quot; data-start=&quot;384&quot;&gt;기본 용량&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;401&quot; data-start=&quot;392&quot;&gt;수백 MB대&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;410&quot; data-start=&quot;401&quot;&gt;수 GB대&lt;/td&gt;
&lt;/tr&gt;
&lt;tr style=&quot;height: 18px;&quot; data-end=&quot;483&quot; data-start=&quot;411&quot;&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;420&quot; data-start=&quot;411&quot;&gt;기본 패키지&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;443&quot; data-start=&quot;420&quot;&gt;최소(conda, 파이썬, 핵심 툴)&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;483&quot; data-start=&quot;443&quot;&gt;넘치는 과학 패키지(NumPy, Pandas, Jupyter 등)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr style=&quot;height: 18px;&quot; data-end=&quot;507&quot; data-start=&quot;484&quot;&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;492&quot; data-start=&quot;484&quot;&gt;설치 시간&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;497&quot; data-start=&quot;492&quot;&gt;짧음&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-end=&quot;507&quot; data-start=&quot;497&quot; data-col-size=&quot;sm&quot;&gt;김.&amp;nbsp;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr style=&quot;height: 18px;&quot; data-end=&quot;554&quot; data-start=&quot;508&quot;&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;518&quot; data-start=&quot;508&quot;&gt;업데이트 부담&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;534&quot; data-start=&quot;518&quot;&gt;낮음(설치한 것만 관리)&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;554&quot; data-start=&quot;534&quot;&gt;높음(많은 패키지 동시 관리)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr style=&quot;height: 18px;&quot; data-end=&quot;599&quot; data-start=&quot;555&quot;&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;560&quot; data-start=&quot;555&quot;&gt;대상&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;582&quot; data-start=&quot;560&quot;&gt;환경을 &amp;ldquo;내가&amp;rdquo; 구성하고 싶은 사람&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;599&quot; data-start=&quot;582&quot;&gt;바로 분석하고 싶은 사람&lt;/td&gt;
&lt;/tr&gt;
&lt;tr style=&quot;height: 18px;&quot; data-end=&quot;647&quot; data-start=&quot;600&quot;&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;606&quot; data-start=&quot;600&quot;&gt;유연성&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;614&quot; data-start=&quot;606&quot;&gt;매우 높음&lt;/td&gt;
&lt;td style=&quot;height: 18px;&quot; data-col-size=&quot;sm&quot; data-end=&quot;647&quot; data-start=&quot;614&quot;&gt;기본은 편하지만, 장기적으로 관리가 번거로울 수 있음&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;h2 data-end=&quot;665&quot; data-start=&quot;649&quot; data-ke-size=&quot;size26&quot;&gt;실제 체감 포인트 5가지&lt;/h2&gt;
&lt;ol style=&quot;list-style-type: decimal;&quot; data-end=&quot;1321&quot; data-start=&quot;666&quot; data-ke-list-type=&quot;decimal&quot;&gt;
&lt;li data-end=&quot;752&quot; data-start=&quot;666&quot;&gt;&lt;b&gt;디스크/업데이트 스트레스&lt;/b&gt;: 아나콘다는 기본 깔리는 게 많아 업데이트 때 시간과 용량을 가져갑니다. 미니콘다는 필요한 것만 깔아서 깔끔해요.&lt;/li&gt;
&lt;li data-end=&quot;864&quot; data-start=&quot;753&quot;&gt;&lt;b&gt;환경 격리 습관&lt;/b&gt;: 어차피 프로젝트마다 conda create -n myenv python=3.11로 새 환경을 만듭니다. 그러니 &amp;ldquo;처음부터 가볍게 시작&amp;rdquo;하는 게 유리할 때가 많죠.&lt;/li&gt;
&lt;li data-end=&quot;1002&quot; data-start=&quot;865&quot;&gt;&lt;b&gt;설치 직후 편의성&lt;/b&gt;: 아나콘다는 바로 jupyter lab 열고 시작하기 좋습니다. 미니콘다는 conda install jupyterlab numpy pandas 같은 준비가 필요하지만, 그 준비가 사실 1~2분이면 끝나요.&lt;/li&gt;
&lt;li data-end=&quot;1198&quot; data-start=&quot;1003&quot;&gt;&lt;b&gt;채널 선택(특히 conda-forge)&lt;/b&gt;: 요즘엔 두 쪽 다 conda-forge 채널을 많이 씁니다. 최신/호환성 측면에서 이 채널을 기본으로 두면(예: conda config --add channels conda-forge &amp;amp;&amp;amp; conda config --set channel_priority strict) 충돌 줄어들어요.&lt;/li&gt;
&lt;li data-end=&quot;1321&quot; data-start=&quot;1199&quot;&gt;&lt;b&gt;협업 &amp;amp; 재현성&lt;/b&gt;: 아나콘다 &amp;ldquo;기본 세트&amp;rdquo;에 기댈수록 팀원 PC마다 버전이 미묘하게 달라질 수 있습니다. 미니콘다는 &lt;b&gt;명시적으로&lt;/b&gt; environment.yml을 관리하게 되어 재현성이 좋아지는 편이죠.&lt;/li&gt;
&lt;/ol&gt;
&lt;h2 data-end=&quot;1332&quot; data-start=&quot;1323&quot; data-ke-size=&quot;size26&quot;&gt;상황별 추천&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1568&quot; data-start=&quot;1333&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1381&quot; data-start=&quot;1333&quot;&gt;&lt;b&gt;첫 입문 + 바로 분석하고 싶음&lt;/b&gt;: 아나콘다. (딱 켜서 노트북 열면 끝)&lt;/li&gt;
&lt;li data-end=&quot;1445&quot; data-start=&quot;1382&quot;&gt;&lt;b&gt;프로젝트 여러 개 + 깔끔 관리 중시&lt;/b&gt;: 미니콘다. (환경이 가벼워서 충돌/업데이트 스트레스가 적음)&lt;/li&gt;
&lt;li data-end=&quot;1474&quot; data-start=&quot;1446&quot;&gt;&lt;b&gt;회사 PC 용량이 빠듯함&lt;/b&gt;: 미니콘다.&lt;/li&gt;
&lt;li data-end=&quot;1568&quot; data-start=&quot;1475&quot;&gt;&lt;b&gt;수업/강의 따라가기&lt;/b&gt;: 강사가 &amp;ldquo;아나콘다 기준&amp;rdquo;이면 그냥 아나콘다로 편하게 가세요. 기준이 없다면 미니콘다 + environment.yml 제공이 베스트.&lt;/li&gt;
&lt;/ul&gt;
&lt;h2 data-end=&quot;1591&quot; data-start=&quot;1570&quot; data-ke-size=&quot;size26&quot;&gt;미니콘다를 위한 최소 셋업 예시&lt;/h2&gt;
&lt;div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/div&gt;
&lt;pre id=&quot;code_1761643609086&quot; class=&quot;bash&quot; data-ke-language=&quot;bash&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;# 미니콘다 설치 후
conda create -n ds python=3.11
conda activate ds
conda config --add channels conda-forge
conda config --set channel_priority strict
conda install jupyterlab numpy pandas matplotlib scikit-learn&lt;/code&gt;&lt;/pre&gt;
&lt;h2 data-end=&quot;1865&quot; data-start=&quot;1843&quot; data-ke-size=&quot;size26&quot;&gt;아나콘다 쓰는데 너무 무겁다 싶다면&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1993&quot; data-start=&quot;1866&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1911&quot; data-start=&quot;1866&quot;&gt;새 프로젝트부터는 &lt;b&gt;미니콘다&lt;/b&gt;로 전환해도 됩니다. 둘이 공존 가능해요.&lt;/li&gt;
&lt;li data-end=&quot;1993&quot; data-start=&quot;1912&quot;&gt;당장 바꾸기 부담되면, 아나콘다 그대로 두고 &lt;b&gt;프로젝트별 가상환경&lt;/b&gt;만 잘게 쪼개 쓰세요. 핵심은 &amp;ldquo;기본(base)을 건드리지 말자&amp;rdquo;입니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;h2 data-end=&quot;2010&quot; data-start=&quot;1995&quot; data-ke-size=&quot;size26&quot;&gt;자주 나오는 오해 정리&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;2317&quot; data-start=&quot;2011&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;2083&quot; data-start=&quot;2011&quot;&gt;&lt;b&gt;&amp;ldquo;미니콘다는 기능이 부족하다?&amp;rdquo;&lt;/b&gt; &amp;rarr; 아니요. 필요할 때 설치하면 됩니다. 오히려 정확히 원하는 스택을 만들기 좋죠.&lt;/li&gt;
&lt;li data-end=&quot;2152&quot; data-start=&quot;2084&quot;&gt;&lt;b&gt;&amp;ldquo;아나콘다는 초보용이다?&amp;rdquo;&lt;/b&gt; &amp;rarr; 편의성의 문제지, 수준의 문제가 아닙니다. 빠르게 시동 걸 땐 여전히 좋아요.&lt;/li&gt;
&lt;li data-end=&quot;2317&quot; data-start=&quot;2153&quot;&gt;&lt;b&gt;&amp;ldquo;pip vs conda?&amp;rdquo;&lt;/b&gt; &amp;rarr; 패키지에 따라 다릅니다. 과학 연산/시스템 의존성이 있는 건 conda가 수월할 때가 많고, 순수 파이썬 패키지는 pip가 더 빠를 때가 있어요. 둘을 같이 써도 되지만, 보통은 conda로 최대한 설치 후 남은 것만 pip로 채웁니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;h2 data-end=&quot;2329&quot; data-start=&quot;2319&quot; data-ke-size=&quot;size26&quot;&gt;개인적인 결론&lt;/h2&gt;
&lt;p data-end=&quot;2499&quot; data-start=&quot;2330&quot; data-ke-size=&quot;size16&quot;&gt;처음엔 아나콘다가 편합니다. 하지만 프로젝트가 늘어날수록 미니콘다의 &amp;ldquo;필요한 것만 갖춘 최소 환경&amp;rdquo;이 관리 스트레스를 줄여줘요. 마트에서 &lt;b&gt;대형 세트&lt;/b&gt;를 한 번에 살지, &lt;b&gt;필요한 재료만&lt;/b&gt; 담을지의 차이랄까요. 저는 대체로 미니콘다 쪽으로 기웁니다.&amp;nbsp;&lt;/p&gt;</description>
      <category>Programming/Python</category>
      <category>Anaconda</category>
      <category>conda</category>
      <category>Miniconda</category>
      <category>python</category>
      <category>가상환경</category>
      <category>데이터분석환경</category>
      <category>패키지관리</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/452</guid>
      <comments>https://allensdatablog.tistory.com/entry/%EB%AF%B8%EB%8B%88%EC%BD%98%EB%8B%A4-vs-%EC%95%84%EB%82%98%EC%BD%98%EB%8B%A4-%EB%AD%90%EA%B0%80-%EB%82%B4-%EC%8A%A4%ED%83%80%EC%9D%BC%EC%9D%BC%EA%B9%8C#entry452comment</comments>
      <pubDate>Wed, 19 Nov 2025 19:29:54 +0900</pubDate>
    </item>
    <item>
      <title>Jupyter Notebook을 .py로 변환하는 가장 간단한 방법</title>
      <link>https://allensdatablog.tistory.com/entry/Jupyter-Notebook%EC%9D%84-py%EB%A1%9C-%EB%B3%80%ED%99%98%ED%95%98%EB%8A%94-%EA%B0%80%EC%9E%A5-%EA%B0%84%EB%8B%A8%ED%95%9C-%EB%B0%A9%EB%B2%95</link>
      <description>&lt;p data-end=&quot;143&quot; data-start=&quot;45&quot; data-ke-size=&quot;size16&quot;&gt;노트북으로 실험하다 보면 &amp;ldquo;이 코드 이제 스크립트로 써야겠다&amp;rdquo; 하는 순간이 오죠. 그럴 때 셀마다 복사 붙여넣기 하지 말고, 그냥 한 줄로 .py 파일로 바꾸면 됩니다.&lt;/p&gt;
&lt;h2 data-end=&quot;169&quot; data-start=&quot;145&quot; data-ke-size=&quot;size26&quot;&gt;1️⃣ nbconvert로 변환하기&lt;/h2&gt;
&lt;p data-end=&quot;223&quot; data-start=&quot;170&quot; data-ke-size=&quot;size16&quot;&gt;Jupyter가 이미 설치돼 있다면 바로 터미널(또는 명령 프롬프트)에서 이렇게 입력하세요.&lt;/p&gt;
&lt;div&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;jupyter nbconvert --to python your_notebook.ipynb&amp;nbsp;&lt;/blockquote&gt;
&lt;/div&gt;
&lt;p data-end=&quot;362&quot; data-start=&quot;286&quot; data-ke-size=&quot;size16&quot;&gt;명령을 실행하면 같은 폴더에 your_notebook.py가 생겨요. 주석으로 셀 구분도 남기 때문에 나중에 다시 보기도 편하죠.&lt;/p&gt;
&lt;blockquote data-end=&quot;418&quot; data-start=&quot;364&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;418&quot; data-start=&quot;366&quot; data-ke-size=&quot;size16&quot;&gt;  예를 들어, EDA.ipynb를 변환하면 EDA.py 파일이 자동 생성됩니다.&lt;/p&gt;
&lt;/blockquote&gt;
&lt;h2 data-end=&quot;445&quot; data-start=&quot;420&quot; data-ke-size=&quot;size26&quot;&gt;&amp;nbsp;&lt;/h2&gt;
&lt;h2 data-end=&quot;445&quot; data-start=&quot;420&quot; data-ke-size=&quot;size26&quot;&gt;2️⃣ JupyterLab에서도 가능&lt;/h2&gt;
&lt;p data-end=&quot;563&quot; data-start=&quot;446&quot; data-ke-size=&quot;size16&quot;&gt;노트북 상단 메뉴에서 &lt;b&gt;File &amp;rarr; Save and Export Notebook As &amp;rarr; Export Notebook to Executable Script&lt;/b&gt; 를 누르면 됩니다. 클릭 한 번으로 끝이에요.&lt;/p&gt;
&lt;h2 data-end=&quot;585&quot; data-start=&quot;565&quot; data-ke-size=&quot;size26&quot;&gt;3️⃣ 왜 이렇게까지 하냐면&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;690&quot; data-start=&quot;586&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;622&quot; data-start=&quot;586&quot;&gt;코드 리뷰나 버전 관리(git)에 훨씬 깔끔하게 남습니다.&lt;/li&gt;
&lt;li data-end=&quot;657&quot; data-start=&quot;623&quot;&gt;실행 로그나 셀 출력 없이 &amp;ldquo;순수한 코드&amp;rdquo;만 정리돼요.&lt;/li&gt;
&lt;li data-end=&quot;690&quot; data-start=&quot;658&quot;&gt;협업할 때 IDE로 바로 실행할 수 있어서 편하죠.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;761&quot; data-start=&quot;692&quot; data-ke-size=&quot;size16&quot;&gt;이런 식으로 한 번 변환해두면, 분석용 노트북과 배포용 스크립트를 깔끔히 나눌 수 있어요. 작지만 꽤 똑똑한 습관입니다.&lt;/p&gt;</description>
      <category>Programming/Python</category>
      <category>jupyter</category>
      <category>nbconvert</category>
      <category>python</category>
      <category>개발팁</category>
      <category>데이터분석</category>
      <category>스크립트</category>
      <category>자동화</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/451</guid>
      <comments>https://allensdatablog.tistory.com/entry/Jupyter-Notebook%EC%9D%84-py%EB%A1%9C-%EB%B3%80%ED%99%98%ED%95%98%EB%8A%94-%EA%B0%80%EC%9E%A5-%EA%B0%84%EB%8B%A8%ED%95%9C-%EB%B0%A9%EB%B2%95#entry451comment</comments>
      <pubDate>Sat, 15 Nov 2025 19:11:19 +0900</pubDate>
    </item>
    <item>
      <title>파이썬에서 한 단계 올라가기 &amp;mdash; Path.cwd().parent</title>
      <link>https://allensdatablog.tistory.com/entry/%ED%8C%8C%EC%9D%B4%EC%8D%AC%EC%97%90%EC%84%9C-%ED%95%9C-%EB%8B%A8%EA%B3%84-%EC%98%AC%EB%9D%BC%EA%B0%80%EA%B8%B0-%E2%80%94-Pathcwdparent</link>
      <description>&lt;p data-end=&quot;148&quot; data-start=&quot;47&quot; data-ke-size=&quot;size16&quot;&gt;데이터 분석하다 보면 이런 상황 한 번쯤 온다.&lt;br /&gt;노트북(.ipynb)은 notebooks/ 폴더 안에 있는데,&lt;br /&gt;데이터 파일은 바로 위 폴더인 data/에 있다.&lt;/p&gt;
&lt;p data-end=&quot;171&quot; data-start=&quot;150&quot; data-ke-size=&quot;size16&quot;&gt;그래서 매번 이런 짓을 하게 된다:&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;&lt;span style=&quot;color: #333333; letter-spacing: 0px;&quot;&gt;pd.read_csv(&lt;/span&gt;&lt;span style=&quot;color: #333333; letter-spacing: 0px;&quot;&gt;'../data/sales.csv'&lt;/span&gt;&lt;span style=&quot;color: #333333; letter-spacing: 0px;&quot;&gt;)&lt;/span&gt;&lt;/blockquote&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;295&quot; data-start=&quot;221&quot; data-ke-size=&quot;size16&quot;&gt;그런데 이게 프로젝트 구조가 조금만 달라져도 바로 깨진다.&lt;br /&gt;(예: 노트북을 다른 폴더에서 열었을 때, ../가 안 맞아짐)&lt;/p&gt;
&lt;hr data-end=&quot;300&quot; data-start=&quot;297&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;314&quot; data-start=&quot;302&quot; data-ke-size=&quot;size26&quot;&gt;깔끔한 해결책&lt;/h2&gt;
&lt;p data-end=&quot;346&quot; data-start=&quot;315&quot; data-ke-size=&quot;size16&quot;&gt;pathlib의 Path를 쓰면 딱 정리된다.&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1761642377277&quot; class=&quot;bash&quot; data-ke-language=&quot;bash&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;from pathlib import Path

BASE_DIR = Path.cwd().parent
DATA_DIR = BASE_DIR / &quot;data&quot;&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;532&quot; data-start=&quot;447&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;495&quot; data-start=&quot;447&quot;&gt;Path.cwd() : 현재 작업 디렉터리 (여기선 notebooks/)&lt;/li&gt;
&lt;li data-end=&quot;532&quot; data-start=&quot;496&quot;&gt;.parent : 그 상위 폴더 (즉, 프로젝트 루트)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;559&quot; data-start=&quot;534&quot; data-ke-size=&quot;size16&quot;&gt;이제 데이터를 읽을 때 이렇게 쓰면 된다.&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/div&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;file = DATA_DIR / &quot;sales.csv&quot;&lt;br /&gt;&lt;span&gt;&lt;span&gt;df = pd.read_csv(file) &lt;/span&gt;&lt;/span&gt;&lt;/blockquote&gt;
&lt;/div&gt;
&lt;p data-end=&quot;667&quot; data-start=&quot;629&quot; data-ke-size=&quot;size16&quot;&gt;딱 봐도 명확하고, ../ 같은 상대경로 게임 안 해도 된다.&lt;/p&gt;
&lt;hr data-end=&quot;672&quot; data-start=&quot;669&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;686&quot; data-start=&quot;674&quot; data-ke-size=&quot;size26&quot;&gt;한 줄로 정리&lt;/h2&gt;
&lt;blockquote data-end=&quot;732&quot; data-start=&quot;687&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;732&quot; data-start=&quot;689&quot; data-ke-size=&quot;size16&quot;&gt;Path.cwd().parent = &amp;ldquo;지금 있는 폴더의 한 단계 위 폴더&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;hr data-end=&quot;737&quot; data-start=&quot;734&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;758&quot; data-start=&quot;739&quot; data-ke-size=&quot;size26&quot;&gt;조금 더 예쁘게 쓰는 버전&lt;/h2&gt;
&lt;p data-end=&quot;782&quot; data-start=&quot;759&quot; data-ke-size=&quot;size16&quot;&gt;경로를 print로 찍어서 확인해보자.&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;&lt;span style=&quot;color: #333333; letter-spacing: 0px;&quot;&gt;print&lt;/span&gt;&lt;span style=&quot;color: #333333; letter-spacing: 0px;&quot;&gt;(BASE_DIR)&lt;br /&gt;&lt;/span&gt;&lt;span style=&quot;color: #333333; letter-spacing: 0px;&quot;&gt;# 출력 예시: C:\Users\allen\project&lt;/span&gt;&lt;/blockquote&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;870&quot; data-start=&quot;847&quot; data-ke-size=&quot;size16&quot;&gt;혹은 여러 단계 위로 올라가고 싶다면:&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1761642421287&quot; class=&quot;bash&quot; data-ke-language=&quot;bash&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;Path.cwd().parents[1]  # 두 단계 위
Path.cwd().parents[2]  # 세 단계 위&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;986&quot; data-start=&quot;949&quot; data-ke-size=&quot;size16&quot;&gt;(부모의 부모의 부모...&amp;nbsp;&lt;/p&gt;
&lt;hr data-end=&quot;991&quot; data-start=&quot;988&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1001&quot; data-start=&quot;993&quot; data-ke-size=&quot;size26&quot;&gt;마무리&lt;/h2&gt;
&lt;p data-end=&quot;1095&quot; data-start=&quot;1002&quot; data-ke-size=&quot;size16&quot;&gt;이런 식으로 &amp;ldquo;경로를 코드로 표현&amp;rdquo;해두면,&lt;br /&gt;노트북 위치가 바뀌어도 경로가 깨질 일이 없다.&lt;br /&gt;그리고 나중에 팀원이 받아도, 폴더 이름만 같으면 바로 돌아간다.&lt;/p&gt;
&lt;p data-end=&quot;1125&quot; data-start=&quot;1097&quot; data-ke-size=&quot;size16&quot;&gt;작은 습관 하나로 &amp;ldquo;경로 지옥&amp;rdquo;에서 탈출 가능.&lt;/p&gt;</description>
      <category>Programming/Python</category>
      <category>OS</category>
      <category>pathlib</category>
      <category>python</category>
      <category>개발</category>
      <category>데이터분석</category>
      <category>코드</category>
      <category>파이썬</category>
      <category>파일경로</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/450</guid>
      <comments>https://allensdatablog.tistory.com/entry/%ED%8C%8C%EC%9D%B4%EC%8D%AC%EC%97%90%EC%84%9C-%ED%95%9C-%EB%8B%A8%EA%B3%84-%EC%98%AC%EB%9D%BC%EA%B0%80%EA%B8%B0-%E2%80%94-Pathcwdparent#entry450comment</comments>
      <pubDate>Tue, 11 Nov 2025 19:07:43 +0900</pubDate>
    </item>
    <item>
      <title>conda 가상환경에서 Jupyter Notebook 실행하기 &amp;mdash; 가장 깔끔한 방법</title>
      <link>https://allensdatablog.tistory.com/entry/conda-%EA%B0%80%EC%83%81%ED%99%98%EA%B2%BD%EC%97%90%EC%84%9C-Jupyter-Notebook-%EC%8B%A4%ED%96%89%ED%95%98%EA%B8%B0-%E2%80%94-%EA%B0%80%EC%9E%A5-%EA%B9%94%EB%81%94%ED%95%9C-%EB%B0%A9%EB%B2%95</link>
      <description>&lt;p data-end=&quot;70&quot; data-start=&quot;52&quot; data-ke-size=&quot;size16&quot;&gt;많은 초보 개발자들이 묻는다.&lt;/p&gt;
&lt;blockquote data-end=&quot;132&quot; data-start=&quot;71&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;132&quot; data-start=&quot;73&quot; data-ke-size=&quot;size16&quot;&gt;&amp;ldquo;내가 만든 conda 가상환경에서 Jupyter Notebook을 바로 열려면 어떻게 해야 하나요?&amp;rdquo;&lt;/p&gt;
&lt;/blockquote&gt;
&lt;p data-end=&quot;171&quot; data-start=&quot;134&quot; data-ke-size=&quot;size16&quot;&gt;아래 순서 한 번 익혀두면, 어떤 환경에서도 바로 쓸 수 있다.&lt;/p&gt;
&lt;hr data-end=&quot;176&quot; data-start=&quot;173&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;202&quot; data-start=&quot;178&quot; data-ke-size=&quot;size26&quot;&gt;1️⃣ Jupyter 설치 (한 번만)&lt;/h2&gt;
&lt;p data-end=&quot;224&quot; data-start=&quot;203&quot; data-ke-size=&quot;size16&quot;&gt;가상환경을 먼저 활성화한 뒤 설치한다.&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1761642056624&quot; class=&quot;bash&quot; data-ke-language=&quot;bash&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;conda activate my_env
conda install notebook ipykernel&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;377&quot; data-start=&quot;294&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;326&quot; data-start=&quot;294&quot;&gt;notebook &amp;rarr; Jupyter 노트북 실행용&lt;/li&gt;
&lt;li data-end=&quot;377&quot; data-start=&quot;327&quot;&gt;ipykernel &amp;rarr; 현재 가상환경을 Jupyter에서 커널(실행 엔진)로 등록&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;382&quot; data-start=&quot;379&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;411&quot; data-start=&quot;384&quot; data-ke-size=&quot;size26&quot;&gt;2️⃣ 내 환경을 커널로 등록 (딱 한 번)&lt;/h2&gt;
&lt;div&gt;
&lt;div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/div&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;python -m ipykernel install --user --name my_env --display-name &quot;my_env&quot;&lt;/blockquote&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;599&quot; data-start=&quot;498&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;535&quot; data-start=&quot;498&quot;&gt;--name : 시스템 내부 식별용 이름 (소문자 권장)&lt;/li&gt;
&lt;li data-end=&quot;599&quot; data-start=&quot;536&quot;&gt;--display-name : JupyterLab / Notebook에서 보일 이름 (영문&amp;middot;한글 가능)&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;604&quot; data-start=&quot;601&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;617&quot; data-start=&quot;606&quot; data-ke-size=&quot;size26&quot;&gt;3️⃣ 실행하기&lt;/h2&gt;
&lt;p data-end=&quot;642&quot; data-start=&quot;618&quot; data-ke-size=&quot;size16&quot;&gt;가상환경을 다시 활성화한 뒤 노트북을 연다.&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;&lt;span style=&quot;color: #333333; letter-spacing: 0px;&quot;&gt;conda activate my_env jupyter notebook&lt;/span&gt;&lt;/blockquote&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;p data-end=&quot;747&quot; data-start=&quot;696&quot; data-ke-size=&quot;size16&quot;&gt;자동으로 브라우저가 열리고, 지정 폴더에서 .ipynb 파일을 만들거나 불러올 수 있다.&lt;/p&gt;
&lt;hr data-end=&quot;752&quot; data-start=&quot;749&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;776&quot; data-start=&quot;754&quot; data-ke-size=&quot;size26&quot;&gt;4️⃣ JupyterLab 도 동일&lt;/h2&gt;
&lt;div&gt;
&lt;div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/div&gt;
&lt;blockquote data-ke-style=&quot;style3&quot;&gt;conda activate my_env&lt;br /&gt;&lt;span&gt;&lt;span&gt;jupyter lab &lt;/span&gt;&lt;/span&gt;&lt;/blockquote&gt;
&lt;/div&gt;
&lt;p data-end=&quot;887&quot; data-start=&quot;823&quot; data-ke-size=&quot;size16&quot;&gt;JupyterLab은 노트북 + 터미널 + 파일탐색기가 통합된 환경이라,&lt;br /&gt;작업 규모가 커질수록 훨씬 편하다.&lt;/p&gt;
&lt;hr data-end=&quot;892&quot; data-start=&quot;889&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;904&quot; data-start=&quot;894&quot; data-ke-size=&quot;size26&quot;&gt;요약 정리&lt;/h2&gt;
&lt;div&gt;
&lt;div&gt;&lt;b&gt;단계&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 명령어&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;설명&lt;/b&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;1230&quot; data-start=&quot;906&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;1230&quot; data-start=&quot;949&quot;&gt;
&lt;tr data-end=&quot;999&quot; data-start=&quot;949&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;960&quot; data-start=&quot;949&quot;&gt;가상환경 활성화&lt;/td&gt;
&lt;td data-end=&quot;986&quot; data-start=&quot;960&quot; data-col-size=&quot;md&quot;&gt;conda activate my_env&lt;/td&gt;
&lt;td data-end=&quot;999&quot; data-start=&quot;986&quot; data-col-size=&quot;sm&quot;&gt;작업할 환경 진입&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1065&quot; data-start=&quot;1000&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1013&quot; data-start=&quot;1000&quot;&gt;Jupyter 설치&lt;/td&gt;
&lt;td data-end=&quot;1050&quot; data-start=&quot;1013&quot; data-col-size=&quot;md&quot;&gt;conda install notebook ipykernel&lt;/td&gt;
&lt;td data-end=&quot;1065&quot; data-start=&quot;1050&quot; data-col-size=&quot;sm&quot;&gt;노트북 &amp;amp; 커널 설치&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1173&quot; data-start=&quot;1066&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1074&quot; data-start=&quot;1066&quot;&gt;커널 등록&lt;/td&gt;
&lt;td data-end=&quot;1151&quot; data-start=&quot;1074&quot; data-col-size=&quot;md&quot;&gt;python -m ipykernel install --user --name my_env --display-name &quot;my_env&quot;&lt;/td&gt;
&lt;td data-end=&quot;1173&quot; data-start=&quot;1151&quot; data-col-size=&quot;sm&quot;&gt;Jupyter에서 인식하도록 등록&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1230&quot; data-start=&quot;1174&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1179&quot; data-start=&quot;1174&quot;&gt;실행&lt;/td&gt;
&lt;td data-col-size=&quot;md&quot; data-end=&quot;1216&quot; data-start=&quot;1179&quot;&gt;jupyter notebook / jupyter lab&lt;/td&gt;
&lt;td data-end=&quot;1230&quot; data-start=&quot;1216&quot; data-col-size=&quot;sm&quot;&gt;브라우저 자동 실행&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;1235&quot; data-start=&quot;1232&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1248&quot; data-start=&quot;1237&quot; data-ke-size=&quot;size26&quot;&gt;기억 포인트&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1381&quot; data-start=&quot;1249&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1279&quot; data-start=&quot;1249&quot;&gt;커널 등록은 &lt;b&gt;환경당 한 번&lt;/b&gt;만 해도 된다.&lt;/li&gt;
&lt;li data-end=&quot;1334&quot; data-start=&quot;1280&quot;&gt;이후에는 그냥 conda activate &amp;rarr; jupyter notebook 순서면 끝.&lt;/li&gt;
&lt;li data-end=&quot;1381&quot; data-start=&quot;1335&quot;&gt;여러 환경을 쓸 땐, Jupyter 상단 메뉴에서 커널 이름으로 전환 가능.&lt;/li&gt;
&lt;/ul&gt;</description>
      <category>Programming/etc</category>
      <category>conda</category>
      <category>ipykernel</category>
      <category>jupyter</category>
      <category>python</category>
      <category>가상환경</category>
      <category>개발환경</category>
      <category>데이터분석</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/449</guid>
      <comments>https://allensdatablog.tistory.com/entry/conda-%EA%B0%80%EC%83%81%ED%99%98%EA%B2%BD%EC%97%90%EC%84%9C-Jupyter-Notebook-%EC%8B%A4%ED%96%89%ED%95%98%EA%B8%B0-%E2%80%94-%EA%B0%80%EC%9E%A5-%EA%B9%94%EB%81%94%ED%95%9C-%EB%B0%A9%EB%B2%95#entry449comment</comments>
      <pubDate>Sun, 9 Nov 2025 19:03:52 +0900</pubDate>
    </item>
    <item>
      <title>파이썬 가상환경, 진짜로 알아두면 편한 이유</title>
      <link>https://allensdatablog.tistory.com/entry/%ED%8C%8C%EC%9D%B4%EC%8D%AC-%EA%B0%80%EC%83%81%ED%99%98%EA%B2%BD-%EC%A7%84%EC%A7%9C%EB%A1%9C-%EC%95%8C%EC%95%84%EB%91%90%EB%A9%B4-%ED%8E%B8%ED%95%9C-%EC%9D%B4%EC%9C%A0</link>
      <description>&lt;h2 data-end=&quot;48&quot; data-start=&quot;30&quot; data-ke-size=&quot;size26&quot;&gt;왜 굳이 가상환경을 쓸까&lt;/h2&gt;
&lt;p data-end=&quot;133&quot; data-start=&quot;49&quot; data-ke-size=&quot;size16&quot;&gt;프로젝트마다 사용하는 &lt;b&gt;라이브러리 버전이 다르기 때문&lt;/b&gt;이다.&lt;br /&gt;하나의 파이썬에 모든 걸 깔면, 서로 버전이 충돌해 코드가 깨지는 일이 생긴다.&lt;/p&gt;
&lt;p data-end=&quot;213&quot; data-start=&quot;135&quot; data-ke-size=&quot;size16&quot;&gt;가상환경은 말 그대로 &amp;ldquo;&lt;b&gt;격리된 파이썬 공간&lt;/b&gt;&amp;rdquo;이다.&lt;br /&gt;프로젝트마다 독립된 환경을 만들어, 다른 프로젝트와 영향을 주고받지 않는다.&lt;/p&gt;
&lt;hr data-end=&quot;218&quot; data-start=&quot;215&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;239&quot; data-start=&quot;220&quot; data-ke-size=&quot;size26&quot;&gt;기본 세팅 &amp;mdash; venv&lt;/h2&gt;
&lt;h3 data-end=&quot;257&quot; data-start=&quot;241&quot; data-ke-size=&quot;size23&quot;&gt;1. 가상환경 생성&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1761641489349&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;python -m venv venv&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;394&quot; data-start=&quot;290&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;326&quot; data-start=&quot;290&quot;&gt;venv는 폴더 이름이다. 보통 프로젝트 루트에 둔다.&lt;/li&gt;
&lt;li data-end=&quot;394&quot; data-start=&quot;327&quot;&gt;실행 후 venv/ 폴더 안에 Scripts(Windows) 혹은 bin(Mac/Linux)이 생긴다.&lt;/li&gt;
&lt;/ul&gt;
&lt;h3 data-end=&quot;413&quot; data-start=&quot;396&quot; data-ke-size=&quot;size23&quot;&gt;2. 가상환경 활성화&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;526&quot; data-start=&quot;414&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;467&quot; data-start=&quot;414&quot;&gt;&lt;b&gt;Windows&lt;/b&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/li&gt;
&lt;li data-end=&quot;526&quot; data-start=&quot;468&quot;&gt;&lt;b&gt;Mac/Linux&lt;/b&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/li&gt;
&lt;/ul&gt;
&lt;pre id=&quot;code_1761641652416&quot; class=&quot;bash&quot; data-ke-language=&quot;bash&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;source venv/bin/activate&lt;/code&gt;&lt;/pre&gt;
&lt;p data-end=&quot;557&quot; data-start=&quot;527&quot; data-ke-size=&quot;size16&quot;&gt;활성화되면 프롬프트에 (venv)처럼 표시된다.&lt;/p&gt;
&lt;h3 data-end=&quot;572&quot; data-start=&quot;559&quot; data-ke-size=&quot;size23&quot;&gt;3. 비활성화&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1761641665356&quot; class=&quot;bash&quot; data-ke-language=&quot;bash&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;deactivate&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;600&quot; data-start=&quot;597&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;613&quot; data-start=&quot;602&quot; data-ke-size=&quot;size26&quot;&gt;설치와 관리&lt;/h2&gt;
&lt;p data-end=&quot;652&quot; data-start=&quot;614&quot; data-ke-size=&quot;size16&quot;&gt;가상환경 안에서는 &lt;b&gt;pip가 자동으로 해당 환경에 설치&lt;/b&gt;된다.&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/div&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;pip install pandas matplotlib&amp;nbsp;&lt;/blockquote&gt;
&lt;/div&gt;
&lt;p data-end=&quot;736&quot; data-start=&quot;697&quot; data-ke-size=&quot;size16&quot;&gt;다른 환경이나 서버에서 같은 구성을 재현하려면 다음처럼 저장해둔다.&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/div&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;pip freeze &amp;gt; requirements.txt&amp;nbsp;&lt;/blockquote&gt;
&lt;/div&gt;
&lt;p data-end=&quot;793&quot; data-start=&quot;780&quot; data-ke-size=&quot;size16&quot;&gt;그리고 다시 설치할 땐:&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;
&lt;div&gt;&amp;nbsp;&lt;/div&gt;
&lt;/div&gt;
&lt;div&gt;&lt;span&gt;&lt;span&gt;pip install -r requirements.txt &lt;/span&gt;&lt;/span&gt;&lt;/div&gt;
&lt;/div&gt;
&lt;blockquote data-end=&quot;880&quot; data-start=&quot;839&quot; data-ke-style=&quot;style1&quot;&gt;
&lt;p data-end=&quot;880&quot; data-start=&quot;841&quot; data-ke-size=&quot;size16&quot;&gt;✅ requirements.txt는 협업이나 배포 때 거의 필수다.&lt;/p&gt;
&lt;/blockquote&gt;
&lt;hr data-end=&quot;885&quot; data-start=&quot;882&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;909&quot; data-start=&quot;887&quot; data-ke-size=&quot;size26&quot;&gt;venv 폴더를 깃에서 제외하기&lt;/h2&gt;
&lt;p data-end=&quot;976&quot; data-start=&quot;910&quot; data-ke-size=&quot;size16&quot;&gt;가상환경은 용량이 크고, OS마다 구조가 달라 공유할 이유가 없다.&lt;br /&gt;.gitignore에 아래 한 줄 넣자.&lt;/p&gt;
&lt;div&gt;
&lt;div&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&lt;span style=&quot;color: #333333; letter-spacing: 0px;&quot;&gt;venv/&lt;/span&gt;&lt;/blockquote&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;995&quot; data-start=&quot;992&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1013&quot; data-start=&quot;997&quot; data-ke-size=&quot;size26&quot;&gt;가상환경 이름 바꾸기&lt;/h2&gt;
&lt;p data-end=&quot;1111&quot; data-start=&quot;1014&quot; data-ke-size=&quot;size16&quot;&gt;python -m venv .env 처럼 이름을 .env, .venv, env 등으로 바꿔도 무방하다.&lt;br /&gt;VSCode나 PyCharm은 자동으로 인식한다.&lt;/p&gt;
&lt;hr data-end=&quot;1116&quot; data-start=&quot;1113&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1165&quot; data-start=&quot;1118&quot; data-ke-size=&quot;size26&quot;&gt;조금 더 편하게 &amp;mdash; virtualenv, pipenv, conda&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1311&quot; data-start=&quot;1166&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1209&quot; data-start=&quot;1166&quot;&gt;virtualenv: venv보다 유연하지만 거의 비슷한 기능.&lt;/li&gt;
&lt;li data-end=&quot;1262&quot; data-start=&quot;1210&quot;&gt;pipenv: 의존성 관리에 초점을 둔 도구. Pipfile로 버전 고정 가능.&lt;/li&gt;
&lt;li data-end=&quot;1311&quot; data-start=&quot;1263&quot;&gt;conda: 데이터 분석&amp;middot;머신러닝용. 패키지와 파이썬 자체를 함께 관리한다.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;1369&quot; data-start=&quot;1313&quot; data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;데이터 분석 쪽&lt;/b&gt;이라면 conda,&lt;br /&gt;&lt;b&gt;일반 파이썬 프로젝트&lt;/b&gt;라면 venv면 충분하다.&lt;/p&gt;
&lt;hr data-end=&quot;1374&quot; data-start=&quot;1371&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1386&quot; data-start=&quot;1376&quot; data-ke-size=&quot;size26&quot;&gt;간단 요약&lt;/h2&gt;
&lt;div&gt;
&lt;div&gt;&lt;b&gt;작업&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 명령어&lt;/b&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-end=&quot;1637&quot; data-start=&quot;1388&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody data-end=&quot;1637&quot; data-start=&quot;1419&quot;&gt;
&lt;tr data-end=&quot;1454&quot; data-start=&quot;1419&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1429&quot; data-start=&quot;1419&quot;&gt;가상환경 생성&lt;/td&gt;
&lt;td data-end=&quot;1454&quot; data-start=&quot;1429&quot; data-col-size=&quot;md&quot;&gt;python -m venv venv&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1536&quot; data-start=&quot;1455&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1461&quot; data-start=&quot;1455&quot;&gt;활성화&lt;/td&gt;
&lt;td data-end=&quot;1536&quot; data-start=&quot;1461&quot; data-col-size=&quot;md&quot;&gt;venv\Scripts\activate (Win)&lt;br /&gt;source venv/bin/activate (Mac/Linux)&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1568&quot; data-start=&quot;1537&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1546&quot; data-start=&quot;1537&quot;&gt;패키지 설치&lt;/td&gt;
&lt;td data-end=&quot;1568&quot; data-start=&quot;1546&quot; data-col-size=&quot;md&quot;&gt;pip install 패키지명&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1613&quot; data-start=&quot;1569&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1578&quot; data-start=&quot;1569&quot;&gt;의존성 저장&lt;/td&gt;
&lt;td data-end=&quot;1613&quot; data-start=&quot;1578&quot; data-col-size=&quot;md&quot;&gt;pip freeze &amp;gt; requirements.txt&lt;/td&gt;
&lt;/tr&gt;
&lt;tr data-end=&quot;1637&quot; data-start=&quot;1614&quot;&gt;
&lt;td data-col-size=&quot;sm&quot; data-end=&quot;1621&quot; data-start=&quot;1614&quot;&gt;비활성화&lt;/td&gt;
&lt;td data-end=&quot;1637&quot; data-start=&quot;1621&quot; data-col-size=&quot;md&quot;&gt;deactivate&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;1642&quot; data-start=&quot;1639&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1652&quot; data-start=&quot;1644&quot; data-ke-size=&quot;size26&quot;&gt;마무리&lt;/h2&gt;
&lt;p data-end=&quot;1766&quot; data-start=&quot;1653&quot; data-ke-size=&quot;size16&quot;&gt;가상환경은 &amp;ldquo;언제 써야 할까?&amp;rdquo;가 아니라 &amp;ldquo;&lt;b&gt;안 쓰면 언제 터질까&lt;/b&gt;&amp;rdquo;에 가까운 문제다.&lt;br /&gt;습관처럼 프로젝트마다 하나씩 만들어 두면,&lt;br /&gt;나중에 꼬이지 않는다 &amp;mdash; 조용하지만 가장 효율적인 예방책이다.&lt;/p&gt;</description>
      <category>Programming/Python</category>
      <category>python</category>
      <category>venv</category>
      <category>가상환경</category>
      <category>개발환경</category>
      <category>파이썬</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/448</guid>
      <comments>https://allensdatablog.tistory.com/entry/%ED%8C%8C%EC%9D%B4%EC%8D%AC-%EA%B0%80%EC%83%81%ED%99%98%EA%B2%BD-%EC%A7%84%EC%A7%9C%EB%A1%9C-%EC%95%8C%EC%95%84%EB%91%90%EB%A9%B4-%ED%8E%B8%ED%95%9C-%EC%9D%B4%EC%9C%A0#entry448comment</comments>
      <pubDate>Thu, 6 Nov 2025 18:57:33 +0900</pubDate>
    </item>
    <item>
      <title>pathlib.Path 한 번에 잡기: 실전 위주 가이드</title>
      <link>https://allensdatablog.tistory.com/entry/pathlibPath-%ED%95%9C-%EB%B2%88%EC%97%90-%EC%9E%A1%EA%B8%B0-%EC%8B%A4%EC%A0%84-%EC%9C%84%EC%A3%BC-%EA%B0%80%EC%9D%B4%EB%93%9C</link>
      <description>&lt;h2 data-end=&quot;45&quot; data-start=&quot;37&quot; data-ke-size=&quot;size26&quot;&gt;핵심 요약&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;225&quot; data-start=&quot;46&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;94&quot; data-start=&quot;46&quot;&gt;Path는 &lt;b&gt;문자열이 아닌 &amp;ldquo;경로 객체&amp;rdquo;&lt;/b&gt;로 파일&amp;middot;디렉터리를 다루게 해준다.&lt;/li&gt;
&lt;li data-end=&quot;132&quot; data-start=&quot;95&quot;&gt;운영체제별 경로 차이(슬래시/백슬래시)를 &lt;b&gt;자동 처리&lt;/b&gt;한다.&lt;/li&gt;
&lt;li data-end=&quot;176&quot; data-start=&quot;133&quot;&gt;읽기/쓰기, 생성/삭제, 탐색(glob)까지 &lt;b&gt;직관적인 메서드&lt;/b&gt; 제공.&lt;/li&gt;
&lt;li data-end=&quot;225&quot; data-start=&quot;177&quot;&gt;이제 os.path/문자열 더하기 대신 &lt;b&gt;연산자(/)로 경로 조합&lt;/b&gt;하자.&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;230&quot; data-start=&quot;227&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;246&quot; data-start=&quot;232&quot; data-ke-size=&quot;size26&quot;&gt;왜 Path인가?&lt;/h2&gt;
&lt;p data-end=&quot;293&quot; data-start=&quot;247&quot; data-ke-size=&quot;size16&quot;&gt;문자열 기반 경로는 덧셈(+)과 구분자 처리에서 자주 꼬인다. Path는&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;421&quot; data-start=&quot;294&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;331&quot; data-start=&quot;294&quot;&gt;a / b처럼 &lt;b&gt;연산자 오버로딩&lt;/b&gt;으로 경로를 합치고,&lt;/li&gt;
&lt;li data-end=&quot;387&quot; data-start=&quot;332&quot;&gt;Path.home() 같은 &lt;b&gt;유틸리티&lt;/b&gt;로 사용자 홈, 현재 디렉터리 등을 쉽게 얻고,&lt;/li&gt;
&lt;li data-end=&quot;421&quot; data-start=&quot;388&quot;&gt;&lt;b&gt;파일 I/O 메서드&lt;/b&gt;를 바로 붙여 쓸 수 있다.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;457&quot; data-start=&quot;423&quot; data-ke-size=&quot;size16&quot;&gt;즉, 덜 쓰고, 더 안전하고, 더 읽기 쉬운 코드가 된다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h2 data-end=&quot;457&quot; data-start=&quot;423&quot; data-ke-size=&quot;size26&quot;&gt;기본 사용&lt;/h2&gt;
&lt;pre id=&quot;code_1761641151015&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;from pathlib import Path

p = Path(&quot;data&quot;) / &quot;input&quot; / &quot;file.txt&quot;   # 경로 조합
print(p)                                   # 운영체제에 맞는 경로 문자열 출력
print(p.exists(), p.is_file(), p.is_dir()) # 존재/파일/폴더 판별&lt;/code&gt;&lt;/pre&gt;
&lt;p data-end=&quot;457&quot; data-start=&quot;423&quot; data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;721&quot; data-start=&quot;686&quot;&gt;/ 연산자는 문자열 연결이 아니라 &lt;b&gt;경로 결합&lt;/b&gt;이다.&lt;/li&gt;
&lt;li data-end=&quot;767&quot; data-start=&quot;722&quot;&gt;exists(), is_file(), is_dir()로 상태 확인.&lt;/li&gt;
&lt;/ul&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;흔한 시작점&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;pre id=&quot;code_1761641183699&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;Path.cwd()      # 현재 작업 디렉터리
Path.home()     # 사용자 홈 디렉터리
Path(__file__)  # 현재 파이썬 파일의 경로 (스크립트에서 유용)&lt;/code&gt;&lt;/pre&gt;
&lt;p data-end=&quot;457&quot; data-start=&quot;423&quot; data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;Path 스타일 vs pathlib 스타일&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;하고 싶은 일&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; os.path 스타일&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; pathlib 스타일&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;경로 결합&lt;/td&gt;
&lt;td&gt;os.path.join(a, b)&lt;/td&gt;
&lt;td&gt;Path(a) / b&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;절대경로&lt;/td&gt;
&lt;td&gt;os.path.abspath(p)&lt;/td&gt;
&lt;td&gt;Path(p).resolve()&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;확장자&lt;/td&gt;
&lt;td&gt;os.path.splitext(p)&lt;/td&gt;
&lt;td&gt;Path(p).suffix, stem&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;존재 확인&lt;/td&gt;
&lt;td&gt;os.path.exists(p)&lt;/td&gt;
&lt;td&gt;Path(p).exists()&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;디렉터리 여부&lt;/td&gt;
&lt;td&gt;os.path.isdir(p)&lt;/td&gt;
&lt;td&gt;Path(p).is_dir()&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;순회&lt;/td&gt;
&lt;td&gt;os.walk(root)&lt;/td&gt;
&lt;td&gt;Path(root).rglob(&quot;*&quot;) 등&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-end=&quot;457&quot; data-start=&quot;423&quot; data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-end=&quot;457&quot; data-start=&quot;423&quot; data-ke-style=&quot;style2&quot;&gt;팁: 기존 코드에 Path만 도입해도 가독성이 확 올라간다.&lt;br /&gt;완전 전환은 점진적으로(os 일부 유지) 진행해도 된다.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr data-end=&quot;4201&quot; data-start=&quot;4198&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;4209&quot; data-start=&quot;4203&quot; data-ke-size=&quot;size26&quot;&gt;마무리&lt;/h2&gt;
&lt;p data-end=&quot;4305&quot; data-start=&quot;4210&quot; data-ke-size=&quot;size16&quot;&gt;Path는 &amp;ldquo;경로를 문자열처럼 대충 다루지 말자&amp;rdquo;는 제안이다.&lt;br /&gt;파일&amp;middot;폴더 조작이 많은 프로젝트일수록 유지보수가 쉬워진다. 지금 쓰는 스크립트에 한 줄부터 바꿔보자:&lt;/p&gt;
&lt;pre id=&quot;code_1761641295884&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;from pathlib import Path
DATA = Path(&quot;data&quot;)&lt;/code&gt;&lt;/pre&gt;</description>
      <category>Programming/Python</category>
      <category>path</category>
      <category>pathlib</category>
      <category>python</category>
      <category>경로</category>
      <category>경로관리</category>
      <category>파일입출력</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/447</guid>
      <comments>https://allensdatablog.tistory.com/entry/pathlibPath-%ED%95%9C-%EB%B2%88%EC%97%90-%EC%9E%A1%EA%B8%B0-%EC%8B%A4%EC%A0%84-%EC%9C%84%EC%A3%BC-%EA%B0%80%EC%9D%B4%EB%93%9C#entry447comment</comments>
      <pubDate>Mon, 3 Nov 2025 18:48:42 +0900</pubDate>
    </item>
    <item>
      <title>3. 표본추출의 기본 - 좋은 데이터는 그냥 만들어지지 않아요</title>
      <link>https://allensdatablog.tistory.com/entry/3-%ED%91%9C%EB%B3%B8%EC%B6%94%EC%B6%9C%EC%9D%98-%EA%B8%B0%EB%B3%B8-%EC%A2%8B%EC%9D%80-%EB%8D%B0%EC%9D%B4%ED%84%B0%EB%8A%94-%EA%B7%B8%EB%83%A5-%EB%A7%8C%EB%93%A4%EC%96%B4%EC%A7%80%EC%A7%80-%EC%95%8A%EC%95%84%EC%9A%94</link>
      <description>&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. &quot;그냥 랜덤하게 뽑으면 되지 않나요?&quot;&lt;/h3&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bcqQqP/dJMcagqe2mp/5hz6fQpnJVMvpWLKWohvFK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bcqQqP/dJMcagqe2mp/5hz6fQpnJVMvpWLKWohvFK/img.png&quot; data-alt=&quot;표본추출&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bcqQqP/dJMcagqe2mp/5hz6fQpnJVMvpWLKWohvFK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FbcqQqP%2FdJMcagqe2mp%2F5hz6fQpnJVMvpWLKWohvFK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;530&quot; height=&quot;530&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;표본추출&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;데이터를 다루다 보면 이런 생각이 듭니다.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;표본추출은 그냥 무작위(random)로 뽑으면 되는 거 아닌가요?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;맞아요, 기본적으로 &lt;b&gt;무작위성(randomness)&lt;/b&gt;은 중요합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;하지만 '어떻게' 무작위로 뽑느냐가 훨씬 중요하죠.&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;아무리 많은 데이터를 모아도, 애초에 &lt;b&gt;뽑는 과정이 치우쳐 있다면&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결과는 이미 편향되어 있습니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 차량 고장 데이터를 분석한다고 해봅시다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;최근 몇 달간의 데이터만 모았는데,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 시기가 우연히 여름철이라면?&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;결국 &lt;b&gt;기온이 높은 계절만의 특성이 반영된 표본&lt;/b&gt;이 될 수 있어요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이건 단순한 우연이 아니라 &lt;b&gt;표본 설계의 실패&lt;/b&gt;예요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 표본추출의 핵심 원리&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표본추출(sampling)은 &lt;b&gt;전체(모집단)&lt;/b&gt; 중 일부를 뽑아 &lt;b&gt;대표성 있는 정보&lt;/b&gt;를 얻는 과정입니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그중에서도 대표성을 지켜주는 세 가지 키워드는 아래와 같아요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;원리&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 설명&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 한 줄 요약&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;무작위성(Randomness)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;모든 개체가 선택될 &lt;b&gt;동일한 기회&lt;/b&gt;를 가져야 함&lt;/td&gt;
&lt;td&gt;&amp;ldquo;누구든 뽑힐 수 있어야 한다&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;대표성(Representativeness)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;표본이 모집단의 &lt;b&gt;다양성을 반영&lt;/b&gt;해야 함&lt;/td&gt;
&lt;td&gt;&amp;ldquo;한쪽에 치우치지 말 것&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;충분한 크기(Sample Size)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;표본이 너무 작으면 &lt;b&gt;변동성&amp;uarr;&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;&amp;ldquo;적어도 수십~수백은 필요하다&amp;rdquo;&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;통계는 이 세 가지를 동시에 만족시키려는 기술이에요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 표본추출의 3가지 주요 방법&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1) 단순 무작위 추출(Simple Random Sampling)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모집단의 모든 요소가 &lt;b&gt;동일한 확률&lt;/b&gt;로 선택됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;가장 기본적인 방식이지만, 현실에선 &lt;b&gt;명단이 완벽&lt;/b&gt;해야 가능해요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예: 자동차 1만대 중 100대를 무작위로 뽑아 품질 점검.&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;장점 : 계산이 단순하고 편향이 적어요.&lt;br /&gt;단점 : 명단이 완전하지 않으면 의미가 없어요.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;2) 층화 추출(Stratified Sampling)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모집단을 &lt;b&gt;중요한 기준(층, stratum)&lt;/b&gt;에 따라 나눈 뒤, 각 층에서 무작위 추출을 합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예: 북미 지역을 '기온대별(한랭, 온난, 열대)'로 나누고 각 지역에서 일정 비율로 표본을 뽑기.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;장점 : 모집단의 다양한 특성을 반영할 수 있어요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;단점 : 층 구분이 잘못되면 오히려 복잡하고 편햘될 수 있어요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;3) 군집 추출(Cluster Sampling)&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;모집단 전체를 &lt;b&gt;군집(Cluster)&lt;/b&gt;으로 나누고, 일부 군집만 무작위로 선택해 그 안의 모든 개체를 조사합니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예: 전국 1,000개 딜러 중 50개 딜러만 무작위로 선정해 그 지점의 모든 자동채 데이터를 분석&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;장점 : 비용과 시간이 적게 들어요.&lt;br /&gt;단점 : 군집 간 차이가 클 경우 대표성이 떨어집니다.&lt;/blockquote&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 현실에서의 예&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&amp;nbsp;상황&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;추천 추출법&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;이유&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;설문조사&lt;/td&gt;
&lt;td&gt;층화 추출&lt;/td&gt;
&lt;td&gt;성별&amp;middot;연령대&amp;middot;지역별 균형 유지&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;생산 품질 점검&lt;/td&gt;
&lt;td&gt;단순 무작위&lt;/td&gt;
&lt;td&gt;공정이 균질한 경우&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;지점별 판매 분석&lt;/td&gt;
&lt;td&gt;군집 추출&lt;/td&gt;
&lt;td&gt;지역 단위로 묶인 경우 효율적&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 샘플 수, 얼마나 뽑아야 할까?&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표본크기 n이 커질수록 &lt;b&gt;표본평균의 불확실성(표준오차)&lt;/b&gt;은 줄어듭니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;간단한 직관식으로 아래처럼 볼 수 있어요.&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignLeft&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;170&quot; data-origin-height=&quot;61&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/4QYBq/dJMcajAu8C9/7rSCReeskRO8aNcF9Zxfrk/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/4QYBq/dJMcajAu8C9/7rSCReeskRO8aNcF9Zxfrk/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/4QYBq/dJMcajAu8C9/7rSCReeskRO8aNcF9Zxfrk/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2F4QYBq%2FdJMcajAu8C9%2F7rSCReeskRO8aNcF9Zxfrk%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;170&quot; height=&quot;61&quot; data-origin-width=&quot;170&quot; data-origin-height=&quot;61&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;2067&quot; data-start=&quot;2045&quot;&gt;&lt;span&gt;&lt;span aria-hidden=&quot;true&quot;&gt;&lt;span&gt;&lt;span&gt;&amp;sigma;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;: 모집단의 표준편차&lt;/li&gt;
&lt;li data-end=&quot;2085&quot; data-start=&quot;2068&quot;&gt;&lt;span&gt;&lt;span aria-hidden=&quot;true&quot;&gt;&lt;span&gt;&lt;span&gt;n&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;: 표본크기&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;즉, 표본을 4배 늘리면 오차는 절반이 됩니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;다만 표본을 10배 늘린다고 오차가 10배 줄진 않아요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;(루트 때문에 완만하게 줄죠.)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;  현실 감각&lt;br /&gt;대략 &amp;plusmn;3% 오차를 목표로 하면 n&amp;asymp;1,000 전후,&lt;br /&gt;&amp;plusmn;5% 수준이면 n&amp;asymp;400 정도로 충분한 경우가 많아요.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 대표성을 해치는 흔한 함정&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1. 시간 편향 -&lt;/b&gt; 특정 시기만 데이터가 몰림&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;2. 선택 편향&lt;/b&gt; - 스스로 참여한 응답자 위주 (예: 자발적 설문)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;3. 누락 편향 -&lt;/b&gt; 특정 집단이 명단에 포함되지 않음 (예: 신규 고객 제외)&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;4. 편의 추출(Convenience Sampling) -&lt;/b&gt; &quot;그냥 구하기 쉬운 데이터만 쓰자&quot;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;편의 추출은 &lt;b&gt;가장 위험하지만 현실에서 가장 흔한 방법&lt;/b&gt;이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;편하다는 이유로 선택하면, 해석 단계에서 후회할수도..&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 한장 요약&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;개념&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;기억 포인트&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;표본추출의 목적&lt;/td&gt;
&lt;td&gt;전체를 대표하는 일부를 얻기 위해&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;좋은 표본의 조건&lt;/td&gt;
&lt;td&gt;무작위성, 대표성, 충분한 크기&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;주요 방법&lt;/td&gt;
&lt;td&gt;단순 무작위 / 층화 / 군집&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;주의할 점&lt;/td&gt;
&lt;td&gt;편향&amp;middot;누락&amp;middot;시간 효과&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;핵심 공식&lt;/td&gt;
&lt;td&gt;( SE = &amp;sigma; / \sqrt{n} )&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;&quot;좋은 데이터는 계산보다 설계에서 만들어진다.&quot;&lt;/span&gt;&lt;/blockquote&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>군집</category>
      <category>기초통계학</category>
      <category>누락</category>
      <category>대표성</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>샘플링</category>
      <category>층화추출</category>
      <category>편향</category>
      <category>표본추출</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/446</guid>
      <comments>https://allensdatablog.tistory.com/entry/3-%ED%91%9C%EB%B3%B8%EC%B6%94%EC%B6%9C%EC%9D%98-%EA%B8%B0%EB%B3%B8-%EC%A2%8B%EC%9D%80-%EB%8D%B0%EC%9D%B4%ED%84%B0%EB%8A%94-%EA%B7%B8%EB%83%A5-%EB%A7%8C%EB%93%A4%EC%96%B4%EC%A7%80%EC%A7%80-%EC%95%8A%EC%95%84%EC%9A%94#entry446comment</comments>
      <pubDate>Thu, 30 Oct 2025 12:37:29 +0900</pubDate>
    </item>
    <item>
      <title>2. 모집단과 표본 - 통계는 '전체'를 어떻게 상상하나</title>
      <link>https://allensdatablog.tistory.com/entry/%EB%AA%A8%EC%A7%91%EB%8B%A8%EA%B3%BC-%ED%91%9C%EB%B3%B8-%ED%86%B5%EA%B3%84%EB%8A%94-%EC%A0%84%EC%B2%B4%EB%A5%BC-%EC%96%B4%EB%96%BB%EA%B2%8C-%EC%83%81%EC%83%81%ED%95%98%EB%82%98</link>
      <description>&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/bfbrak/dJMb82r9j6w/SXyRkTdo73PfY5KnSAuIVK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/bfbrak/dJMb82r9j6w/SXyRkTdo73PfY5KnSAuIVK/img.png&quot; data-alt=&quot;모집단과 표본&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/bfbrak/dJMb82r9j6w/SXyRkTdo73PfY5KnSAuIVK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2Fbfbrak%2FdJMb82r9j6w%2FSXyRkTdo73PfY5KnSAuIVK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;569&quot; height=&quot;569&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;figcaption&gt;모집단과 표본&lt;/figcaption&gt;
&lt;/figure&gt;
&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;&amp;nbsp;&lt;/h3&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;1. 왜 이걸 먼저 이해해야 할까&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;우리가 보는 데이터는 대부분 &lt;b&gt;전체(모집단)&lt;/b&gt;가 아니라 &lt;b&gt;일부(표본)&lt;/b&gt;예요. 설문 1,000명, 생산라인 하루치, A/B 실험의 2주치... 전부 &lt;b&gt;표본&lt;/b&gt;이죠. 통계는 이 표본으로 보이지 않는 &lt;b&gt;전체&lt;/b&gt;를 추정하려는 시도에요. 그래서 &quot;표본이 얼마나 '대표'인지&quot;를 끊임없이 따집니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;2. 핵심 정의 한줄&amp;nbsp;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt;모집단(population)&lt;/b&gt; : 우리가 알고 싶은 &lt;b&gt;전체&lt;/b&gt;. 예) 현대 자동차 전량의 고장률.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;표본(Sample)&lt;/b&gt; : 실제로 관측한 일부. 예) 2025년 6~10월 수리 접수된 1,200건.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;모수(parameter)&lt;/b&gt; : 모집단의 진짜 값(정답). 예) 전체 고장률 p.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;통계량(statisic)&lt;/b&gt; : 표본으로 계산한 값(추정치). 예) 표본 고장률 &lt;span&gt;&lt;span aria-hidden=&quot;true&quot;&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;p&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;span&gt;^&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;span&gt;​&lt;/span&gt;&lt;/span&gt;&lt;span&gt;&lt;span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;&lt;/span&gt;.&lt;/li&gt;
&lt;/ul&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;기억 포인트 : 우리는 모수를 모르기 때문에 통계량으로 추정합니다.&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;3. 직감으로 보는 '대표성'&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;표본이 대표적이지 않으면, 그 어떤 멋진 모델도 불안정할 수 있어요.&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt;편향(bias)&lt;/b&gt; : 특정 조건에 치우쳐 뽑힘. (주말만 뽑아 근무패턴 왜곡)&lt;/li&gt;
&lt;li&gt;&lt;b&gt;변동성(variance) :&lt;/b&gt; 운에 따라 표본 값이 불안정함. (표번이 너무 작으면 불안정)&lt;/li&gt;
&lt;li&gt;&lt;b&gt;표본크기(n)&lt;/b&gt; : 대체로 클수록 안정.&amp;nbsp;&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;4. 현실 예시 3가지&lt;/h3&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;1. 품질 데이터&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;2% 불량률을 추정하려면, 생산 초반 하루치(특수상황)만 보지 말고 여러 날, 라인을 섞어 뽑아야 해요. 그래야 라인/날짜 효과가 평균화되어 대표성이 살아납니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;2. A/B 테스트&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;신규 UI가 전환율을 올렸는지 보려면, 유입 채널, 시간대, 디바이스가 균형되게 표본이 배정되어야 해요. 한쪽에 모바일만 몰리면 표본이 기울죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;3. 설문조사&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;만족도 조사에 &quot;자발적으로&quot; 응한 사람만 모이면 극단 의견이 과대표집돼요. 이게 자기선택편향. 무작위표집이 괜히 강조되는 게 아닙니다.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;5. 흔한 오해 바로잡기&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&quot;표본이 크면 무조건 정답에 가깝다?&quot; -&amp;gt; &lt;b&gt;대표성&lt;/b&gt;이 먼저예요. 큰 표본이라도 한쪽으로 치우치면 크게 틀릴 수 있어요.&lt;/li&gt;
&lt;li&gt;&quot;표본 평균 = 모집단의 평균?&quot; -&amp;gt; 표본 평균은 &lt;b&gt;추정치&lt;/b&gt;예요. 항상 &lt;b&gt;오차&lt;/b&gt;가 붙습니다. 그래서 신뢰구간을 같이 말해 줘야 해요.&lt;/li&gt;
&lt;li&gt;&quot;과거 데이터로 충분하다?&quot; -&amp;gt; 공정이 바뀌거나 고객 구성이 달라지면, 그 표본은 더 이상 현재의 모집단을 대표하지 않아요. 시간축 편향 주의.&lt;/li&gt;
&lt;li&gt;&amp;nbsp;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/clKTUz/dJMb9MbQwF3/pd1ZVUUyDYMmxAgsjuURgK/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/clKTUz/dJMb9MbQwF3/pd1ZVUUyDYMmxAgsjuURgK/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/clKTUz/dJMb9MbQwF3/pd1ZVUUyDYMmxAgsjuURgK/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FclKTUz%2FdJMb9MbQwF3%2Fpd1ZVUUyDYMmxAgsjuURgK%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;594&quot; height=&quot;594&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;6. 실무 팁&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;&lt;b&gt;표본 프레임&lt;/b&gt;부터 의심하기 : 표본을 뽑아오는 &lt;b&gt;원천 리스트&lt;/b&gt;가 전체를 제대로 덮고 있는지 먼저 점검&lt;/li&gt;
&lt;li&gt;&lt;b&gt;층화추출&lt;/b&gt; 가볍게라도 : 라인/지역/채널 등 중요한 축으로 쪼개 &lt;b&gt;각 층에서 무작위&lt;/b&gt;로 뽑으면, 같은 n으로도 더 안정적.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;n 감각 챙기기&lt;/b&gt; : 대략적으로 &quot;비율 p를 +-3% 정도로 보고 싶다&quot;면 n ~~ 1,000 이 자주 등장해요(러프한 감). 처음 설계 단계에서 목표 오차 -&amp;gt; 필요 n을 대충이라도 계산해두면 쓸데없는 실험 반복이 줄어요.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;샘플 변동 확인&lt;/b&gt; : 표본을 여러 번 뽑았을 떄 값이 얼마나 흔들릴지&lt;b&gt; 부트스트랩&lt;/b&gt;으로 감 잡아보면 설득력이 확 올라갑니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;h3 data-ke-size=&quot;size23&quot;&gt;7. 한 장 요약&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;통계는 &lt;b&gt;표본 -&amp;gt; 모집단&lt;/b&gt;으로의 점프를 관리하는 기술.&lt;/li&gt;
&lt;li&gt;핵심은 &lt;b&gt;대표성, 편향, 변동성, 표본크기&lt;/b&gt; 네 축.&lt;/li&gt;
&lt;li&gt;&quot;큰 표본&quot;보다 &quot;제대로 뽑힌 표본&quot;이 먼저.&lt;/li&gt;
&lt;li&gt;오차는 자연스러워요. &lt;b&gt;오차를 인정하고 관리&lt;/b&gt;하는 훨씬 효율적이에요.&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>기초통계학</category>
      <category>대표성</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>모집단과표본</category>
      <category>통계</category>
      <category>표본추출</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/445</guid>
      <comments>https://allensdatablog.tistory.com/entry/%EB%AA%A8%EC%A7%91%EB%8B%A8%EA%B3%BC-%ED%91%9C%EB%B3%B8-%ED%86%B5%EA%B3%84%EB%8A%94-%EC%A0%84%EC%B2%B4%EB%A5%BC-%EC%96%B4%EB%96%BB%EA%B2%8C-%EC%83%81%EC%83%81%ED%95%98%EB%82%98#entry445comment</comments>
      <pubDate>Mon, 27 Oct 2025 08:43:47 +0900</pubDate>
    </item>
    <item>
      <title>1. 통계학은 숫자를 다루는 학문이 아니에요</title>
      <link>https://allensdatablog.tistory.com/entry/1-%ED%86%B5%EA%B3%84%ED%95%99%EC%9D%80-%EC%88%AB%EC%9E%90%EB%A5%BC-%EB%8B%A4%EB%A3%A8%EB%8A%94-%ED%95%99%EB%AC%B8%EC%9D%B4-%EC%95%84%EB%8B%88%EC%97%90%EC%9A%94</link>
      <description>&lt;blockquote data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;- 데이터 사이언스의 언어, 그 시작점&lt;/span&gt;&lt;/blockquote&gt;
&lt;p&gt;&lt;figure class=&quot;imageblock alignCenter&quot; data-ke-mobileStyle=&quot;widthOrigin&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;&gt;&lt;span data-url=&quot;https://blog.kakaocdn.net/dn/mtG8Z/dJMb85bkCcE/oxA5dE99kZQ9uHMvgoDUe0/img.png&quot; data-phocus=&quot;https://blog.kakaocdn.net/dn/mtG8Z/dJMb85bkCcE/oxA5dE99kZQ9uHMvgoDUe0/img.png&quot;&gt;&lt;img src=&quot;https://blog.kakaocdn.net/dn/mtG8Z/dJMb85bkCcE/oxA5dE99kZQ9uHMvgoDUe0/img.png&quot; srcset=&quot;https://img1.daumcdn.net/thumb/R1280x0/?scode=mtistory2&amp;fname=https%3A%2F%2Fblog.kakaocdn.net%2Fdn%2FmtG8Z%2FdJMb85bkCcE%2FoxA5dE99kZQ9uHMvgoDUe0%2Fimg.png&quot; onerror=&quot;this.onerror=null; this.src='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png'; this.srcset='//t1.daumcdn.net/tistory_admin/static/images/no-image-v1.png';&quot; loading=&quot;lazy&quot; width=&quot;554&quot; height=&quot;554&quot; data-origin-width=&quot;1024&quot; data-origin-height=&quot;1024&quot;/&gt;&lt;/span&gt;&lt;/figure&gt;
&lt;/p&gt;
&lt;h2 data-ke-size=&quot;size26&quot;&gt;1. &quot;오늘 비 올 확률이 70%래요&quot;&lt;/h2&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;오늘 강수 확률은 70%입니다.&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이 말을 듣고 어떤 사람은 우산을 챙기고,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;또 어떤 사람은 &quot;30%면 안 올 수도 있겠네?&quot; 하며 그냥 나가죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;재미있는 건,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;비가 오느냐 안오느냐보다 &lt;b&gt;사람마다 '확률'을 해석하는 방식이 다르다는 점&lt;/b&gt;이에요&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;누군가는 조심성을 택하고,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;누군가는 낙관을 택하죠.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이게 바로 통계의 출발점이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;불확실한 세상에서 어떻게 판달할 것인가.&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;통계학은 완벽한 정답을 알려주는 학문이 아니에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;대신 &quot;틀릴 수도 있는 상황에서, 그래도 제일 합리적인 선택&quot;을 돕는 학문이라 생각해요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h2 data-ke-size=&quot;size26&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;2. 통계의 본질은 '의사결정의 언어'예요&lt;/span&gt;&lt;/h2&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;통계라고 하면 보통 '숫자 계산', '그래프', '평균' 을 떠올리죠.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;물론 이 말이 틀린건 아닌데요,&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;하지만 통계의 진짜 핵심은&lt;b&gt; 숫자가 아니라 사고방식&lt;/b&gt;이라 생각합니다.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;구분&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;의미&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;예시&lt;/b&gt;&lt;/p&gt;
&lt;table style=&quot;border-collapse: collapse; width: 100%;&quot; border=&quot;1&quot; data-ke-align=&quot;alignLeft&quot;&gt;
&lt;tbody&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;기술통계 (Descriptive Statistics)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;이미 가지고 있는 데이터를 요약하고 정리&lt;/td&gt;
&lt;td&gt;평균, 중앙값, 표준편차, 그래프&lt;/td&gt;
&lt;/tr&gt;
&lt;tr&gt;
&lt;td&gt;&lt;b&gt;추론통계 (Inferential Statistics)&lt;/b&gt;&lt;/td&gt;
&lt;td&gt;일부 데이터를 통해 전체를 추정하고 판단&lt;/td&gt;
&lt;td&gt;가설검정, 신뢰구간, 회귀분석&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;
&lt;/table&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;통계는 늘 이렇게 물어요&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;&quot;이 데이터가 세상을 얼마나 잘 대표하고 있을까?&quot;&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;결국 통계는 &lt;b&gt;보이는 일부를 가지고 보이지 않는 전체를 상상하는 기술&lt;/b&gt;이에요.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;데이터를 보는 눈이자, 세상을 읽는 감각이기도 하죠.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h2 data-ke-size=&quot;size26&quot;&gt;&lt;span&gt;3. 평균 하나로는 부족해요&lt;/span&gt;&lt;/h2&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;예를 들어서, &lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;A공장과 B공장 두 곳의 불량이 모두 2%라고 칩시다.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;숫자만 보면 똑같아 보이죠?&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;그런데 자세히 보면,&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;A공장은 매일 꾸준히 불량이 2%씩 나고,&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;B공장은 대부분 멀쩡하다가 특정 시기에만 불량이 몰려요.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;두 공장의 평균은 같지만,&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;그 안의 내용은 완전 다르죠?&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;이게 바로 통계의 핵심이에요.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;숫자 하나로는 현상을 다 담을 수 없다.&lt;/span&gt;&lt;/span&gt;&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그래서 우리는 평균만 보지 않고 &lt;b&gt;분산, 표준편차, 분포&lt;/b&gt;를 함께 봐야 돼요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;숫자는 사실을 요약하지만,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;그 과정에서 중요한 정보가 빠지기도 하거든요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;통계는 숫자를 그대로 믿지 않고,&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;숫자가 만들어진 과정&lt;/b&gt;을 보는 학문이에요.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h2 data-ke-size=&quot;size26&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;4. 통계는 '데이터의 언어'예요&lt;/span&gt;&lt;/span&gt;&lt;/h2&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;통계는 기술이 아니라 언어예요.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;데이터를 읽고, 해석하고, 설득하기 위한 언어 말이죠&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li&gt;엔지니어에게는 품질을 설명하는 언어&lt;/li&gt;
&lt;li&gt;마케터에게는 소비자를 이해하는 언어&lt;/li&gt;
&lt;li&gt;연구자에게는 가설을 검증하는 언어가 됩니다&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;예를 들어 자동차의 센서 데이터를 본다고 해볼까요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;특정 부품의 온도가 갑자기 튀면, 그건 단순한 숫자 이상이에요.&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&quot;이상 현상이 통계적으로 유의한가?&quot;&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;b&gt;&quot;이 현상이 반복될 확률은 얼마나 될까?&quot;&lt;/b&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;이런 질문들이 바로 통계의 언어로 번역되는 순간이라 생각합니다.&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;h2 data-ke-size=&quot;size26&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;5. 불확실성을 다루는 용기&lt;/span&gt;&lt;/span&gt;&lt;/h2&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;처음 통계를 배우면 좀 답답할 수 있어요.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;&quot;왜 이렇게 복잡하게 돌아가는거야?&quot; 싶은데요&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;하지만 통계는 세상의 불확실함을 없애려 하지 않아요.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;오히려 그걸 &lt;b&gt;인정하고 수치로 다루는 법&lt;/b&gt;을 가르쳐줍니다.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;완벽한 설명은 없어요.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;다만, 조금 더 나은 해석이 있을 뿐이죠.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;그래서 통계를 공부하면 숫자를 믿기보다, &lt;b&gt;숫자를 의심하는 눈&lt;/b&gt;이 생깁니다.&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;blockquote data-ke-style=&quot;style2&quot;&gt;통계는 숫자를 믿는 학문이 아니라, 숫자를 의심하는 법을 배우는 학문이라 생각해요&lt;/blockquote&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;hr contenteditable=&quot;false&quot; data-ke-type=&quot;horizontalRule&quot; data-ke-style=&quot;style6&quot; /&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&lt;span style=&quot;font-family: AppleSDGothicNeo-Regular, 'Malgun Gothic', '맑은 고딕', dotum, 돋움, sans-serif;&quot;&gt;&lt;span&gt;이제부터 이 기초통계 시리즈에서는 그 '의심의 기술'을 하나씩 익혀가 봅시다  &lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;
&lt;p data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Statistics/기초 통계</category>
      <category>Statistics</category>
      <category>기초통계</category>
      <category>데이터분석</category>
      <category>데이터사이언스</category>
      <category>비전공</category>
      <category>통계입문</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/444</guid>
      <comments>https://allensdatablog.tistory.com/entry/1-%ED%86%B5%EA%B3%84%ED%95%99%EC%9D%80-%EC%88%AB%EC%9E%90%EB%A5%BC-%EB%8B%A4%EB%A3%A8%EB%8A%94-%ED%95%99%EB%AC%B8%EC%9D%B4-%EC%95%84%EB%8B%88%EC%97%90%EC%9A%94#entry444comment</comments>
      <pubDate>Fri, 24 Oct 2025 10:23:56 +0900</pubDate>
    </item>
    <item>
      <title>⚡ Power FX 실전 &amp;mdash; 예약 실행(스케줄러)와 반복 작업 자동화</title>
      <link>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%98%88%EC%95%BD-%EC%8B%A4%ED%96%89%EC%8A%A4%EC%BC%80%EC%A4%84%EB%9F%AC%EC%99%80-%EB%B0%98%EB%B3%B5-%EC%9E%91%EC%97%85-%EC%9E%90%EB%8F%99%ED%99%94</link>
      <description>&lt;blockquote data-end=&quot;199&quot; data-start=&quot;42&quot; data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;이번 포스트에선 Power Apps와 Power Automate를 활용해&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;예약 실행(스케줄러), 반복 업무 자동화, 정기 알림 기능을 구현하는 방법을 소개합니다.&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;매일/매주 자동 리포트 발송, 정기 데이터 업데이트, 자동 백업 등 실무 자동화에 바로 쓸 수 있습니다.&lt;/span&gt;&lt;/blockquote&gt;
&lt;hr data-end=&quot;204&quot; data-start=&quot;201&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;244&quot; data-start=&quot;206&quot; data-ke-size=&quot;size26&quot;&gt; ️ Power Automate로 예약 흐름(Flow) 만들기&lt;/h2&gt;
&lt;h3 data-end=&quot;272&quot; data-start=&quot;246&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;예약 트리거(flow) 생성&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;380&quot; data-start=&quot;273&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;321&quot; data-start=&quot;273&quot;&gt;Power Automate에서 &lt;b&gt;&amp;lsquo;일정&amp;rsquo;(Recurrence) 트리거&lt;/b&gt; 선택&lt;/li&gt;
&lt;li data-end=&quot;380&quot; data-start=&quot;322&quot;&gt;실행 주기(분/시간/일/주/월) 자유롭게 지정
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;380&quot; data-start=&quot;354&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;380&quot; data-start=&quot;354&quot;&gt;예) 매일 오전 9시, 매주 월요일 8시 등&lt;/li&gt;
&lt;/ul&gt;
&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;385&quot; data-start=&quot;382&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;417&quot; data-start=&quot;387&quot; data-ke-size=&quot;size23&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;2) &lt;b&gt;흐름(Flow)에서 자동 작업 추가&lt;/b&gt;&lt;/span&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;534&quot; data-start=&quot;418&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;462&quot; data-start=&quot;418&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;SharePoint, Dataverse, Excel 등 데이터 읽기/쓰기&lt;/span&gt;&lt;/li&gt;
&lt;li data-end=&quot;501&quot; data-start=&quot;463&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;메일 발송, Teams/Slack 알림, 외부 API 호출 등&lt;/span&gt;&lt;/li&gt;
&lt;li data-end=&quot;534&quot; data-start=&quot;502&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;예: &lt;b&gt;매일 결재 대기자에게 알림 메일 자동 발송&lt;/b&gt;&lt;/span&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;539&quot; data-start=&quot;536&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;573&quot; data-start=&quot;541&quot; data-ke-size=&quot;size23&quot;&gt;3) &lt;b&gt;Power Apps와 연계한 예약 실행&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;651&quot; data-start=&quot;574&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;620&quot; data-start=&quot;574&quot;&gt;예약 흐름에서 특정 데이터를 Power Apps 데이터 소스에 업데이트/삽입&lt;/li&gt;
&lt;li data-end=&quot;651&quot; data-start=&quot;621&quot;&gt;예약 알림/업무 로그를 앱 내에서 실시간 조회 가능&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;656&quot; data-start=&quot;653&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;686&quot; data-start=&quot;658&quot; data-ke-size=&quot;size26&quot;&gt; ️ 반복 작업 자동화(정기적 데이터 처리)&lt;/h2&gt;
&lt;h3 data-end=&quot;711&quot; data-start=&quot;688&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;정기 백업/데이터 이전&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;750&quot; data-start=&quot;712&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;750&quot; data-start=&quot;712&quot;&gt;예: SharePoint &amp;rarr; Excel, 데이터 일괄 복사, 보관&lt;/li&gt;
&lt;/ul&gt;
&lt;h3 data-end=&quot;778&quot; data-start=&quot;752&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;정기 리포트/통계 자동 전송&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;856&quot; data-start=&quot;779&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;856&quot; data-start=&quot;779&quot;&gt;예: 매주 매출 요약, 누적 실적, 프로젝트 현황 등&lt;br /&gt;Power Automate로 PDF/Excel 리포트 자동 생성 &amp;amp; 메일 발송&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;861&quot; data-start=&quot;858&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;885&quot; data-start=&quot;863&quot; data-ke-size=&quot;size26&quot;&gt; ️ 예약 알림과 사용자 인터랙션&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1002&quot; data-start=&quot;887&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;960&quot; data-start=&quot;887&quot;&gt;매일/매주/월 등 주기적 일정 도래 시&lt;br /&gt;Power Apps의 Notify/배너/Push 알림 등과 연동해 사용자에게 안내&lt;/li&gt;
&lt;li data-end=&quot;1002&quot; data-start=&quot;961&quot;&gt;앱 내 대시보드에 오늘 할 일, 마감 일정, 신규 메시지 등 자동 표시&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1007&quot; data-start=&quot;1004&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1021&quot; data-start=&quot;1009&quot; data-ke-size=&quot;size23&quot;&gt;함수/속성 설명&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1195&quot; data-start=&quot;1023&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1076&quot; data-start=&quot;1023&quot;&gt;&lt;b&gt;Power Automate(흐름)&lt;/b&gt; : 예약 트리거, 반복 작업, 알림 자동화 등 담당&lt;/li&gt;
&lt;li data-end=&quot;1110&quot; data-start=&quot;1077&quot;&gt;&lt;b&gt;Recurrence&lt;/b&gt; : 반복(스케줄) 트리거 설정&lt;/li&gt;
&lt;li data-end=&quot;1152&quot; data-start=&quot;1111&quot;&gt;&lt;b&gt;Power Apps 데이터 소스&lt;/b&gt; : 흐름에서 읽기/쓰기/업데이트&lt;/li&gt;
&lt;li data-end=&quot;1195&quot; data-start=&quot;1153&quot;&gt;&lt;b&gt;Notify, Patch 등&lt;/b&gt; : 앱 내 실시간 알림, 데이터 반영&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1200&quot; data-start=&quot;1197&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1213&quot; data-start=&quot;1202&quot; data-ke-size=&quot;size26&quot;&gt;실무 활용 예시&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1295&quot; data-start=&quot;1215&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1237&quot; data-start=&quot;1215&quot;&gt;매주 업무 보고서 자동 발송 및 저장&lt;/li&gt;
&lt;li data-end=&quot;1272&quot; data-start=&quot;1238&quot;&gt;프로젝트 마감일 도래 시 자동 알림 및 담당자 메시지 전송&lt;/li&gt;
&lt;li data-end=&quot;1295&quot; data-start=&quot;1273&quot;&gt;주기적 데이터 정리/이관, 이력 관리&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1300&quot; data-start=&quot;1297&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1309&quot; data-start=&quot;1302&quot; data-ke-size=&quot;size26&quot;&gt;실무 팁&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1433&quot; data-start=&quot;1311&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1346&quot; data-start=&quot;1311&quot;&gt;예약 실행 주기/시간대는 팀 업무 패턴에 맞게 유연하게 조정&lt;/li&gt;
&lt;li data-end=&quot;1381&quot; data-start=&quot;1347&quot;&gt;자동화 흐름에 실패/예외 처리(알림, 재시도 등) 꼭 추가&lt;/li&gt;
&lt;li data-end=&quot;1433&quot; data-start=&quot;1382&quot;&gt;예약 흐름 결과는 앱 내 컬렉션/로그에 기록해&lt;br /&gt;관리자 모니터링/감사 용도로 활용 가능&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1438&quot; data-start=&quot;1435&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1446&quot; data-start=&quot;1440&quot; data-ke-size=&quot;size26&quot;&gt;마무리&lt;/h2&gt;
&lt;p data-end=&quot;1569&quot; data-start=&quot;1448&quot; data-ke-size=&quot;size16&quot;&gt;Power Automate의 예약 실행(스케줄러) 기능을 활용하면&lt;br /&gt;Power Apps 앱을 더욱 자동화되고 체계적으로 운영할 수 있습니다.&lt;br /&gt;반복 업무를 줄이고, 실시간 정보 전달&amp;middot;데이터 품질까지 함께 잡으세요.&lt;/p&gt;</description>
      <category>Programming/Power Apps(PowerFx)</category>
      <category>powerapps</category>
      <category>Powerautomate</category>
      <category>powerfx</category>
      <category>스케줄러</category>
      <category>앱개발</category>
      <category>예약실행</category>
      <category>자동화</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/443</guid>
      <comments>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%98%88%EC%95%BD-%EC%8B%A4%ED%96%89%EC%8A%A4%EC%BC%80%EC%A4%84%EB%9F%AC%EC%99%80-%EB%B0%98%EB%B3%B5-%EC%9E%91%EC%97%85-%EC%9E%90%EB%8F%99%ED%99%94#entry443comment</comments>
      <pubDate>Sun, 28 Sep 2025 10:20:10 +0900</pubDate>
    </item>
    <item>
      <title>⚡ Power FX 실전 &amp;mdash; 차트 대시보드 구현과 데이터 시각화 팁</title>
      <link>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%B0%A8%ED%8A%B8-%EB%8C%80%EC%8B%9C%EB%B3%B4%EB%93%9C-%EA%B5%AC%ED%98%84%EA%B3%BC-%EB%8D%B0%EC%9D%B4%ED%84%B0-%EC%8B%9C%EA%B0%81%ED%99%94-%ED%8C%81</link>
      <description>&lt;blockquote data-end=&quot;207&quot; data-start=&quot;41&quot; data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;이번 포스트에선 Power Apps에서 차트(Chart) 대시보드를 구현하고,&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;데이터를 시각적으로 보여주는 다양한 방법,&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;실전 앱에서 바로 쓸 수 있는 대시보드 설계&amp;middot;활용 팁을 정리합니다.&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;매출, 업무 현황, 트렌드, 집계 결과 등 실시간 데이터 분석에 바로 적용할 수 있습니다.&lt;/span&gt;&lt;/blockquote&gt;
&lt;hr data-end=&quot;212&quot; data-start=&quot;209&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;248&quot; data-start=&quot;214&quot; data-ke-size=&quot;size26&quot;&gt; ️ 기본 차트 컨트롤 활용(막대, 꺾은선, 원형 등)&lt;/h2&gt;
&lt;h3 data-end=&quot;280&quot; data-start=&quot;250&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;차트 컨트롤 삽입 및 데이터 바인딩&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;407&quot; data-start=&quot;281&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;376&quot; data-start=&quot;281&quot;&gt;Power Apps에서 기본 제공하는 &lt;b&gt;Column chart(세로 막대)&lt;/b&gt;, &lt;b&gt;Line chart(꺾은선)&lt;/b&gt;, &lt;b&gt;Pie chart(원형)&lt;/b&gt; 컨트롤 추가&lt;/li&gt;
&lt;li data-end=&quot;407&quot; data-start=&quot;377&quot;&gt;&lt;b&gt;Items&lt;/b&gt; 속성에 데이터 테이블/컬렉션 연결&lt;/li&gt;
&lt;/ul&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749023982463&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 예시: 월별 매출 데이터 컬렉션
colSalesData = [
    { Month: &quot;1월&quot;, Sales: 2000 },
    { Month: &quot;2월&quot;, Sales: 3500 },
    ...
]

// ColumnChart.Items
colSalesData&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;579&quot; data-start=&quot;576&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;606&quot; data-start=&quot;581&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;차트 축, 범례, 값 매핑&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;694&quot; data-start=&quot;607&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;641&quot; data-start=&quot;607&quot;&gt;&lt;b&gt;Series&lt;/b&gt; : 차트에 표시할 값(예: Sales)&lt;/li&gt;
&lt;li data-end=&quot;676&quot; data-start=&quot;642&quot;&gt;&lt;b&gt;CategoryField&lt;/b&gt; : 분류(예: Month)&lt;/li&gt;
&lt;li data-end=&quot;694&quot; data-start=&quot;677&quot;&gt;차트 컨트롤 속성창에서 매핑&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;699&quot; data-start=&quot;696&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;721&quot; data-start=&quot;701&quot; data-ke-size=&quot;size26&quot;&gt; ️ 동적 필터/조건부 시각화&lt;/h2&gt;
&lt;h3 data-end=&quot;757&quot; data-start=&quot;723&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;드롭다운/날짜 선택에 따라 차트 자동 갱신&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749023988290&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// ddYear.Selected.Value(연도), ddTeam.Selected.Value(팀)
Filter(
    colSalesData,
    Year = ddYear.Selected.Value &amp;amp;&amp;amp; Team = ddTeam.Selected.Value
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;945&quot; data-start=&quot;921&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;945&quot; data-start=&quot;921&quot;&gt;사용자 입력에 따라 실시간 대시보드 변화&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;950&quot; data-start=&quot;947&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;978&quot; data-start=&quot;952&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;차트와 갤러리/통계 값 연동&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1044&quot; data-start=&quot;979&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1009&quot; data-start=&quot;979&quot;&gt;갤러리, 카드, 수치 요약 등과 함께 화면 배치&lt;/li&gt;
&lt;li data-end=&quot;1044&quot; data-start=&quot;1010&quot;&gt;차트 클릭 시 상세 데이터 연동(Selected 값 활용)&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1049&quot; data-start=&quot;1046&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1070&quot; data-start=&quot;1051&quot; data-ke-size=&quot;size26&quot;&gt; ️ 실전 대시보드 구성 팁&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1197&quot; data-start=&quot;1072&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1119&quot; data-start=&quot;1072&quot;&gt;**요약/지표(카드) + 추이(차트) + 리스트(갤러리)**를 한 화면에 배치&lt;/li&gt;
&lt;li data-end=&quot;1158&quot; data-start=&quot;1120&quot;&gt;KPI(핵심 지표), 이상치 경고 등 조건부 색상/아이콘 활용&lt;/li&gt;
&lt;li data-end=&quot;1197&quot; data-start=&quot;1159&quot;&gt;최근 데이터/지난달/전년동기 등 비교값, 증감률 등도 카드로 표시&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1202&quot; data-start=&quot;1199&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1230&quot; data-start=&quot;1204&quot; data-ke-size=&quot;size26&quot;&gt; ️ 커스텀 시각화(갤러리, SVG 등)&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1351&quot; data-start=&quot;1232&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1312&quot; data-start=&quot;1232&quot;&gt;기본 차트 기능 한계를 느낀다면&lt;br /&gt;갤러리+ProgressBar 조합, SVG 이미지/아이콘 동적 바인딩 등으로&lt;br /&gt;다양한 시각화 연출 가능&lt;/li&gt;
&lt;li data-end=&quot;1351&quot; data-start=&quot;1313&quot;&gt;Power BI를 함께 임베드하면 고급 분석 대시보드 구축도 가능&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1356&quot; data-start=&quot;1353&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1370&quot; data-start=&quot;1358&quot; data-ke-size=&quot;size23&quot;&gt;함수/속성 설명&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1495&quot; data-start=&quot;1372&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1421&quot; data-start=&quot;1372&quot;&gt;&lt;b&gt;Filter, Sum, GroupBy 등&lt;/b&gt; : 차트/대시보드 데이터 집계에 활용&lt;/li&gt;
&lt;li data-end=&quot;1456&quot; data-start=&quot;1422&quot;&gt;&lt;b&gt;Items&lt;/b&gt; : 차트/갤러리/카드의 데이터 소스 연결&lt;/li&gt;
&lt;li data-end=&quot;1495&quot; data-start=&quot;1457&quot;&gt;&lt;b&gt;Selected&lt;/b&gt; : 사용자가 차트 등에서 선택한 항목 정보&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1500&quot; data-start=&quot;1497&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1509&quot; data-start=&quot;1502&quot; data-ke-size=&quot;size26&quot;&gt;실무 팁&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1650&quot; data-start=&quot;1511&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1567&quot; data-start=&quot;1511&quot;&gt;데이터 컬렉션은 앱 시작 시 미리 로딩,&lt;br /&gt;필터 조건 변경 시 즉시 Refresh하는 패턴 권장&lt;/li&gt;
&lt;li data-end=&quot;1650&quot; data-start=&quot;1568&quot;&gt;차트 컨트롤 속성에서 Series, CategoryField 매핑이 맞지 않으면&lt;br /&gt;차트가 비어있거나 오류가 발생하므로 데이터 구조 반드시 확인&lt;/li&gt;
&lt;/ul&gt;</description>
      <category>Programming/Power Apps(PowerFx)</category>
      <category>MS</category>
      <category>powerapps</category>
      <category>powerfx</category>
      <category>앱개발</category>
      <category>자동화</category>
      <category>코딩</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/442</guid>
      <comments>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%B0%A8%ED%8A%B8-%EB%8C%80%EC%8B%9C%EB%B3%B4%EB%93%9C-%EA%B5%AC%ED%98%84%EA%B3%BC-%EB%8D%B0%EC%9D%B4%ED%84%B0-%EC%8B%9C%EA%B0%81%ED%99%94-%ED%8C%81#entry442comment</comments>
      <pubDate>Tue, 23 Sep 2025 18:00:05 +0900</pubDate>
    </item>
    <item>
      <title>⚡ Power FX 실전 &amp;mdash; 외부 API/HTTP 연동으로 데이터 자동화 확장하기</title>
      <link>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%99%B8%EB%B6%80-APIHTTP-%EC%97%B0%EB%8F%99%EC%9C%BC%EB%A1%9C-%EB%8D%B0%EC%9D%B4%ED%84%B0-%EC%9E%90%EB%8F%99%ED%99%94-%ED%99%95%EC%9E%A5%ED%95%98%EA%B8%B0</link>
      <description>&lt;blockquote data-end=&quot;193&quot; data-start=&quot;49&quot; data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;이번 포스트에선 Power Apps에서 외부 시스템과 데이터를 주고받는&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;API(HTTP 요청) 연동 구현 방법과,&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;실무에서 많이 활용하는 데이터 자동화 시나리오 예시,&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;Power FX와 Power Automate의 협업 패턴까지 정리합니다.&lt;/span&gt;&lt;/blockquote&gt;
&lt;hr data-end=&quot;198&quot; data-start=&quot;195&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;245&quot; data-start=&quot;200&quot; data-ke-size=&quot;size26&quot;&gt; ️ Power Apps + Power Automate로 API 호출 패턴&lt;/h2&gt;
&lt;p data-end=&quot;377&quot; data-start=&quot;247&quot; data-ke-size=&quot;size16&quot;&gt;Power Apps 자체에서는 REST API/HTTP 요청을 직접 보낼 수 없지만,&lt;br /&gt;&lt;b&gt;Power Automate(흔히 &amp;ldquo;흐름&amp;rdquo;이라고 부름)와 연결해&lt;/b&gt;&lt;br /&gt;외부 API 호출, 결과 반환, 데이터 저장까지 자동화할 수 있습니다.&lt;/p&gt;
&lt;hr data-end=&quot;382&quot; data-start=&quot;379&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;426&quot; data-start=&quot;384&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;Power Automate에서 HTTP 요청 흐름 만들기&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;534&quot; data-start=&quot;427&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;534&quot; data-start=&quot;427&quot;&gt;Power Automate에서 &lt;b&gt;새 흐름(Flow)&lt;/b&gt; 생성 &amp;rarr;&lt;br /&gt;&amp;ldquo;Power Apps에서 흐름 시작&amp;rdquo; 트리거 선택 &amp;rarr;&lt;br /&gt;&amp;ldquo;HTTP 요청&amp;rdquo; 액션 추가(외부 API/GET/POST 등)&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;539&quot; data-start=&quot;536&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;580&quot; data-start=&quot;541&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;Power Apps에서 흐름 호출 및 파라미터 전달&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749018928902&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 예시: WeatherFlow라는 Power Automate 흐름 실행, 도시명 전달
Set(weatherResult, WeatherFlow.Run(txtCity.Text))&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;790&quot; data-start=&quot;696&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;756&quot; data-start=&quot;696&quot;&gt;&lt;b&gt;WeatherFlow.Run()&lt;/b&gt; : Power Automate에서 만든 흐름 실행(파라미터 전달)&lt;/li&gt;
&lt;li data-end=&quot;790&quot; data-start=&quot;757&quot;&gt;&lt;b&gt;txtCity.Text&lt;/b&gt; : 사용자가 입력한 도시명&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;795&quot; data-start=&quot;792&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;821&quot; data-start=&quot;797&quot; data-ke-size=&quot;size23&quot;&gt;3) &lt;b&gt;흐름에서 받은 결과 활용&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;905&quot; data-start=&quot;822&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;876&quot; data-start=&quot;822&quot;&gt;흐름이 실행을 마치면 Power Apps로 응답 데이터(weatherResult)가 반환됨&lt;/li&gt;
&lt;li data-end=&quot;905&quot; data-start=&quot;877&quot;&gt;라벨, 갤러리 등에서 해당 변수의 값 활용 가능&lt;/li&gt;
&lt;/ul&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749018935674&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 예: 결과를 라벨에 표시
lblWeather.Text = weatherResult&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;975&quot; data-start=&quot;972&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;998&quot; data-start=&quot;977&quot; data-ke-size=&quot;size26&quot;&gt; ️ 활용 가능한 대표 시나리오&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1114&quot; data-start=&quot;1000&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1044&quot; data-start=&quot;1000&quot;&gt;실시간 환율, 날씨, 뉴스, 사내 시스템 등 외부 데이터 앱 내 실시간 표시&lt;/li&gt;
&lt;li data-end=&quot;1080&quot; data-start=&quot;1045&quot;&gt;ERP, CRM 등 백엔드 시스템과 자동 연동(업무 자동화)&lt;/li&gt;
&lt;li data-end=&quot;1114&quot; data-start=&quot;1081&quot;&gt;파일 업로드/다운로드, 메일 발송, 승인/보고 자동화 등&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1119&quot; data-start=&quot;1116&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1133&quot; data-start=&quot;1121&quot; data-ke-size=&quot;size23&quot;&gt;함수/속성 설명&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1262&quot; data-start=&quot;1135&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1165&quot; data-start=&quot;1135&quot;&gt;&lt;b&gt;Set(변수, 값)&lt;/b&gt; : 흐름 실행 결과 저장&lt;/li&gt;
&lt;li data-end=&quot;1211&quot; data-start=&quot;1166&quot;&gt;&lt;b&gt;FlowName.Run(파라미터)&lt;/b&gt; : Power Apps에서 흐름 호출&lt;/li&gt;
&lt;li data-end=&quot;1262&quot; data-start=&quot;1212&quot;&gt;&lt;b&gt;Power Automate 흐름&lt;/b&gt; : HTTP, 데이터 파싱, 응답 반환까지 담당&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1267&quot; data-start=&quot;1264&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1276&quot; data-start=&quot;1269&quot; data-ke-size=&quot;size26&quot;&gt;실무 팁&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1425&quot; data-start=&quot;1278&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1349&quot; data-start=&quot;1278&quot;&gt;Power Automate 흐름은 &lt;b&gt;응답(Response) 액션&lt;/b&gt;을 꼭 추가해야&lt;br /&gt;Power Apps로 데이터가 반환됨&lt;/li&gt;
&lt;li data-end=&quot;1391&quot; data-start=&quot;1350&quot;&gt;흐름과 앱 간 파라미터 전달 시 형식/이름을 일치시켜야 오류 없이 동작&lt;/li&gt;
&lt;li data-end=&quot;1425&quot; data-start=&quot;1392&quot;&gt;대용량/민감 데이터는 API 사용량&amp;middot;보안정책도 함께 고려&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1430&quot; data-start=&quot;1427&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1438&quot; data-start=&quot;1432&quot; data-ke-size=&quot;size26&quot;&gt;마무리&lt;/h2&gt;
&lt;p data-end=&quot;1572&quot; data-start=&quot;1440&quot; data-ke-size=&quot;size16&quot;&gt;Power Apps와 Power Automate를 연계하면&lt;br /&gt;앱에서 직접 할 수 없던 API 연동, 외부 데이터 활용,&lt;br /&gt;자동화 기능까지 손쉽게 확장할 수 있습니다.&lt;br /&gt;최신 사내/외부 시스템 연동 요구에 꼭 필요한 실전 패턴입니다.&lt;/p&gt;
&lt;p data-end=&quot;1667&quot; data-start=&quot;1594&quot; data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Programming/Power Apps(PowerFx)</category>
      <category>API</category>
      <category>http</category>
      <category>powerapps</category>
      <category>Powerautomate</category>
      <category>powerfx</category>
      <category>실전팁</category>
      <category>앱개발</category>
      <category>외부연동</category>
      <category>흐름</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/441</guid>
      <comments>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%99%B8%EB%B6%80-APIHTTP-%EC%97%B0%EB%8F%99%EC%9C%BC%EB%A1%9C-%EB%8D%B0%EC%9D%B4%ED%84%B0-%EC%9E%90%EB%8F%99%ED%99%94-%ED%99%95%EC%9E%A5%ED%95%98%EA%B8%B0#entry441comment</comments>
      <pubDate>Sat, 20 Sep 2025 17:28:14 +0900</pubDate>
    </item>
    <item>
      <title>⚡ Power FX 실전 &amp;mdash; 다중 파일 첨부 고급 활용법</title>
      <link>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EB%8B%A4%EC%A4%91-%ED%8C%8C%EC%9D%BC-%EC%B2%A8%EB%B6%80-%EA%B3%A0%EA%B8%89-%ED%99%9C%EC%9A%A9%EB%B2%95</link>
      <description>&lt;blockquote data-end=&quot;212&quot; data-start=&quot;35&quot; data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;이번 포스트에선 Power Apps에서 여러 개의 파일(사진, 문서 등)을 한 번에 첨부하고,&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;각 파일의 상태 관리, 미리보기, 삭제, 일괄 저장까지 지원하는 &lt;/span&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;고급 다중 파일 첨부 구현 패턴을 정리합니다.&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;보고서 제출, 견적서&amp;middot;계약서 관리, 업무자료 일괄 업로드 등 실무에 바로 적용할 수 있습니다.&lt;/span&gt;&lt;/blockquote&gt;
&lt;hr data-end=&quot;217&quot; data-start=&quot;214&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;252&quot; data-start=&quot;219&quot; data-ke-size=&quot;size26&quot;&gt; ️ Attachment 컨트롤로 다중 파일 첨부하기&lt;/h2&gt;
&lt;h3 data-end=&quot;291&quot; data-start=&quot;254&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;폼(Form)에 Attachment 컨트롤 추가&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;386&quot; data-start=&quot;292&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;348&quot; data-start=&quot;292&quot;&gt;SharePoint/Form 데이터 소스 연결 시 &lt;b&gt;Attachments&lt;/b&gt; 필드 자동 생성&lt;/li&gt;
&lt;li data-end=&quot;386&quot; data-start=&quot;349&quot;&gt;단일/다중 파일 모두 지원, 드래그 앤 드롭 및 파일 선택 가능&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;391&quot; data-start=&quot;388&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;418&quot; data-start=&quot;393&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;첨부 파일 목록/상태 관리&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749018111134&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 첨부파일 리스트 표시 (갤러리, 카드 등)
AttachmentControl.Attachments&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;568&quot; data-start=&quot;491&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;530&quot; data-start=&quot;491&quot;&gt;&lt;b&gt;AttachmentControl&lt;/b&gt; : 첨부파일 컨트롤 이름&lt;/li&gt;
&lt;li data-end=&quot;568&quot; data-start=&quot;531&quot;&gt;&lt;b&gt;.Attachments&lt;/b&gt; : 현재 첨부된 모든 파일의 배열&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;573&quot; data-start=&quot;570&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;601&quot; data-start=&quot;575&quot; data-ke-size=&quot;size23&quot;&gt;3) &lt;b&gt;첨부파일 미리보기/삭제 기능&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;710&quot; data-start=&quot;602&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;638&quot; data-start=&quot;602&quot;&gt;이미지, PDF 등은 &lt;b&gt;미리보기(Preview)&lt;/b&gt; 지원&lt;/li&gt;
&lt;li data-end=&quot;664&quot; data-start=&quot;639&quot;&gt;각 파일 옆에 &lt;b&gt;삭제 아이콘&lt;/b&gt; 배치&lt;/li&gt;
&lt;li data-end=&quot;710&quot; data-start=&quot;665&quot;&gt;갤러리 내 Visible, RemoveFile 함수 조합으로 파일별 삭제 구현&lt;/li&gt;
&lt;/ul&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749018122755&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 삭제 버튼 OnSelect
Remove(AttachmentControl.Attachments, ThisItem)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;797&quot; data-start=&quot;794&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;832&quot; data-start=&quot;799&quot; data-ke-size=&quot;size23&quot;&gt;4) &lt;b&gt;첨부파일 데이터와 본문 데이터 일괄 저장&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;893&quot; data-start=&quot;833&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;893&quot; data-start=&quot;833&quot;&gt;SubmitForm 또는 Patch 실행 시&lt;br /&gt;첨부파일 컨트롤의 내용도 함께 데이터 소스에 자동 업로드&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;898&quot; data-start=&quot;895&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;928&quot; data-start=&quot;900&quot; data-ke-size=&quot;size26&quot;&gt; ️ 실전 활용: 첨부파일에 추가 정보 입력&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1067&quot; data-start=&quot;930&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;997&quot; data-start=&quot;930&quot;&gt;갤러리로 첨부파일 리스트를 표시하고,&lt;br /&gt;각 파일 옆에 &amp;ldquo;설명&amp;rdquo;, &amp;ldquo;카테고리&amp;rdquo;, &amp;ldquo;참고사항&amp;rdquo; 등 추가 입력란 배치&lt;/li&gt;
&lt;li data-end=&quot;1038&quot; data-start=&quot;998&quot;&gt;갤러리 Selected/ThisItem을 활용해 파일별 정보 입력&lt;/li&gt;
&lt;li data-end=&quot;1067&quot; data-start=&quot;1039&quot;&gt;최종 저장 시 파일 정보+메타데이터 함께 업로드&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1072&quot; data-start=&quot;1069&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1086&quot; data-start=&quot;1074&quot; data-ke-size=&quot;size23&quot;&gt;함수/속성 설명&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1247&quot; data-start=&quot;1088&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1135&quot; data-start=&quot;1088&quot;&gt;&lt;b&gt;AttachmentControl.Attachments&lt;/b&gt; : 첨부된 파일 배열&lt;/li&gt;
&lt;li data-end=&quot;1176&quot; data-start=&quot;1136&quot;&gt;&lt;b&gt;Remove(컬렉션, 항목)&lt;/b&gt; : 파일 목록에서 해당 파일 제거&lt;/li&gt;
&lt;li data-end=&quot;1211&quot; data-start=&quot;1177&quot;&gt;&lt;b&gt;SubmitForm&lt;/b&gt; : 본문+첨부파일 한 번에 저장&lt;/li&gt;
&lt;li data-end=&quot;1247&quot; data-start=&quot;1212&quot;&gt;&lt;b&gt;ThisItem&lt;/b&gt; : 갤러리 내 현재 선택된 파일 참조&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1252&quot; data-start=&quot;1249&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1265&quot; data-start=&quot;1254&quot; data-ke-size=&quot;size26&quot;&gt;실무 활용 예시&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1363&quot; data-start=&quot;1267&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1302&quot; data-start=&quot;1267&quot;&gt;각종 제출물, 계약&amp;middot;보고자료, 견적서 등 다중 첨부파일 처리&lt;/li&gt;
&lt;li data-end=&quot;1335&quot; data-start=&quot;1303&quot;&gt;사진+설명 동시 저장(품질 이슈 보고, 점검 결과 등)&lt;/li&gt;
&lt;li data-end=&quot;1363&quot; data-start=&quot;1336&quot;&gt;승인/검토용 자료 일괄 업로드, 일괄 다운로드&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1368&quot; data-start=&quot;1365&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1377&quot; data-start=&quot;1370&quot; data-ke-size=&quot;size26&quot;&gt;실무 팁&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1570&quot; data-start=&quot;1379&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1424&quot; data-start=&quot;1379&quot;&gt;첨부파일 용량/확장자 제한은 컨트롤 속성 및 앱 안내 메시지로 명확히 설정&lt;/li&gt;
&lt;li data-end=&quot;1511&quot; data-start=&quot;1425&quot;&gt;데이터 소스에 따라 첨부파일 개수&amp;middot;크기 제한이 다르므로(SharePoint, Dataverse 등)&lt;br /&gt;배포 전 반드시 실제 데이터 업로드 테스트 필수&lt;/li&gt;
&lt;li data-end=&quot;1570&quot; data-start=&quot;1512&quot;&gt;파일 미리보기 기능과 상태 표시(업로드 중, 성공, 실패 등) 구현 시&lt;br /&gt;사용자 경험이 크게 향상됨&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1575&quot; data-start=&quot;1572&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1583&quot; data-start=&quot;1577&quot; data-ke-size=&quot;size26&quot;&gt;마무리&lt;/h2&gt;
&lt;p data-end=&quot;1712&quot; data-start=&quot;1585&quot; data-ke-size=&quot;size16&quot;&gt;다중 파일 첨부는 단순 업로드를 넘어&lt;br /&gt;파일별 상태 관리, 설명 등 부가정보와 결합하면&lt;br /&gt;실무 앱의 활용성과 완성도가 크게 높아집니다.&lt;br /&gt;Power FX와 Attachment 컨트롤의 다양한 속성을 적극적으로 활용해보세요.&lt;/p&gt;
&lt;p data-end=&quot;1805&quot; data-start=&quot;1734&quot; data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Programming/Power Apps(PowerFx)</category>
      <category>attachment</category>
      <category>powerapps</category>
      <category>powerfx</category>
      <category>갤러리</category>
      <category>다중파일</category>
      <category>업로드</category>
      <category>첨부파일</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/440</guid>
      <comments>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EB%8B%A4%EC%A4%91-%ED%8C%8C%EC%9D%BC-%EC%B2%A8%EB%B6%80-%EA%B3%A0%EA%B8%89-%ED%99%9C%EC%9A%A9%EB%B2%95#entry440comment</comments>
      <pubDate>Tue, 16 Sep 2025 16:22:23 +0900</pubDate>
    </item>
    <item>
      <title>⚡ Power FX 실전 &amp;mdash; 조건부 접근 제어와 사용자별 맞춤 데이터 뷰 구현</title>
      <link>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%A1%B0%EA%B1%B4%EB%B6%80-%EC%A0%91%EA%B7%BC-%EC%A0%9C%EC%96%B4%EC%99%80-%EC%82%AC%EC%9A%A9%EC%9E%90%EB%B3%84-%EB%A7%9E%EC%B6%A4-%EB%8D%B0%EC%9D%B4%ED%84%B0-%EB%B7%B0-%EA%B5%AC%ED%98%84</link>
      <description>&lt;blockquote data-end=&quot;224&quot; data-start=&quot;47&quot; data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;이번 포스트에선 Power Apps에서 사용자 역할, 로그인 정보, 데이터 권한에 따라&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;&lt;br /&gt;화면, 버튼, 데이터 뷰를 동적으로 제어하는 대표적인 Power FX 구현 패턴을 정리합니다.&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;조직 내 관리자/일반 사용자/게스트별 기능 제한,&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;사용자별 맞춤 대시보드 등 다양한 실무 요구에 대응할 수 있습니다.&lt;/span&gt;&lt;/blockquote&gt;
&lt;hr data-end=&quot;229&quot; data-start=&quot;226&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;253&quot; data-start=&quot;231&quot; data-ke-size=&quot;size26&quot;&gt; ️ 조건부 화면&amp;middot;버튼 접근 제어&lt;/h2&gt;
&lt;h3 data-end=&quot;286&quot; data-start=&quot;255&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;로그인 사용자 이메일 기반 접근 제한&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749017892987&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 관리자만 설정 버튼 볼 수 있게
btnSettings.Visible = User().Email in [&quot;admin@company.com&quot;, &quot;manager@company.com&quot;]&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;456&quot; data-start=&quot;406&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;456&quot; data-start=&quot;406&quot;&gt;&lt;b&gt;btnSettings.Visible&lt;/b&gt; : 관리자 이메일 목록에 포함된 경우만 노출&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;461&quot; data-start=&quot;458&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;518&quot; data-start=&quot;463&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;외부 권한 테이블 연동(SharePoint, Excel, Dataverse 등)&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749017917790&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 권한 관리 테이블(AdminUsers)와 연동
btnSettings.Visible = !IsBlank(LookUp(AdminUsers, Email = User().Email))&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;671&quot; data-start=&quot;636&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;671&quot; data-start=&quot;636&quot;&gt;&lt;b&gt;AdminUsers&lt;/b&gt; : 권한 있는 사용자 명단 테이블&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;676&quot; data-start=&quot;673&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;703&quot; data-start=&quot;678&quot; data-ke-size=&quot;size23&quot;&gt;3) &lt;b&gt;화면 진입 자체를 제한하기&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749017929713&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// App OnStart 혹은 화면 진입 시
If(
    !IsBlank(LookUp(AdminUsers, Email = User().Email)),
    Navigate(ScreenAdmin),
    Notify(&quot;접근 권한이 없습니다.&quot;, NotificationType.Error)
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;912&quot; data-start=&quot;885&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;912&quot; data-start=&quot;885&quot;&gt;관리자가 아니면 화면 전환 차단 + 안내 알림&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;917&quot; data-start=&quot;914&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;942&quot; data-start=&quot;919&quot; data-ke-size=&quot;size26&quot;&gt; ️ 사용자별 맞춤 데이터 뷰 구현&lt;/h2&gt;
&lt;h3 data-end=&quot;974&quot; data-start=&quot;944&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;로그인 사용자에게만 내 데이터 표시&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749017947780&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 갤러리 Items
Filter(
    Orders,
    UserEmail = User().Email
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1114&quot; data-start=&quot;1054&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1079&quot; data-start=&quot;1054&quot;&gt;&lt;b&gt;Orders&lt;/b&gt; : 전체 데이터 테이블&lt;/li&gt;
&lt;li data-end=&quot;1114&quot; data-start=&quot;1080&quot;&gt;&lt;b&gt;UserEmail&lt;/b&gt; : 각 행에 저장된 담당자 이메일&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1119&quot; data-start=&quot;1116&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1147&quot; data-start=&quot;1121&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;팀/조직별 데이터 분리 표시&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749017955026&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;Filter(
    Projects,
    Team = ddTeam.Selected.Value
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1274&quot; data-start=&quot;1220&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1246&quot; data-start=&quot;1220&quot;&gt;&lt;b&gt;ddTeam&lt;/b&gt; : 드롭다운에서 팀 선택&lt;/li&gt;
&lt;li data-end=&quot;1274&quot; data-start=&quot;1247&quot;&gt;&lt;b&gt;Projects&lt;/b&gt; : 팀별 프로젝트 목록&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1279&quot; data-start=&quot;1276&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1309&quot; data-start=&quot;1281&quot; data-ke-size=&quot;size23&quot;&gt;3) &lt;b&gt;사용자 권한별 데이터 범위 제한&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749017962565&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 예: 관리자면 전체, 일반 사용자는 본인 데이터만
If(
    User().Email in [&quot;admin@company.com&quot;, &quot;manager@company.com&quot;],
    Orders,
    Filter(Orders, UserEmail = User().Email)
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;1489&quot; data-start=&quot;1486&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1503&quot; data-start=&quot;1491&quot; data-ke-size=&quot;size23&quot;&gt;함수/속성 설명&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1646&quot; data-start=&quot;1505&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1541&quot; data-start=&quot;1505&quot;&gt;&lt;b&gt;User().Email&lt;/b&gt; : 현재 로그인 사용자의 이메일&lt;/li&gt;
&lt;li data-end=&quot;1581&quot; data-start=&quot;1542&quot;&gt;&lt;b&gt;LookUp(테이블, 조건)&lt;/b&gt; : 권한 테이블에서 사용자 검색&lt;/li&gt;
&lt;li data-end=&quot;1614&quot; data-start=&quot;1582&quot;&gt;&lt;b&gt;Filter(테이블, 조건)&lt;/b&gt; : 데이터 행 제한&lt;/li&gt;
&lt;li data-end=&quot;1646&quot; data-start=&quot;1615&quot;&gt;&lt;b&gt;Visible&lt;/b&gt; : 컨트롤(버튼 등) 노출 제어&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1651&quot; data-start=&quot;1648&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1664&quot; data-start=&quot;1653&quot; data-ke-size=&quot;size26&quot;&gt;실무 활용 예시&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1741&quot; data-start=&quot;1666&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1695&quot; data-start=&quot;1666&quot;&gt;승인자/관리자/사용자 역할별 화면&amp;middot;기능 차등 제공&lt;/li&gt;
&lt;li data-end=&quot;1717&quot; data-start=&quot;1696&quot;&gt;부서/지점/지역별 데이터 자동 분리&lt;/li&gt;
&lt;li data-end=&quot;1741&quot; data-start=&quot;1718&quot;&gt;개인정보 보호 등 법적 요건 준수 구현&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1746&quot; data-start=&quot;1743&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1755&quot; data-start=&quot;1748&quot; data-ke-size=&quot;size26&quot;&gt;실무 팁&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1852&quot; data-start=&quot;1757&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1779&quot; data-start=&quot;1757&quot;&gt;권한 관리 테이블은 정기적으로 최신화&lt;/li&gt;
&lt;li data-end=&quot;1821&quot; data-start=&quot;1780&quot;&gt;Visible, Items 등 컨트롤 속성에 조건부 수식을 명확히 적용&lt;/li&gt;
&lt;li data-end=&quot;1852&quot; data-start=&quot;1822&quot;&gt;사용자 맞춤 데이터는 성능/보안 모두 고려하여 구현&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1857&quot; data-start=&quot;1854&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1865&quot; data-start=&quot;1859&quot; data-ke-size=&quot;size26&quot;&gt;마무리&lt;/h2&gt;
&lt;p data-end=&quot;1997&quot; data-start=&quot;1867&quot; data-ke-size=&quot;size16&quot;&gt;조건부 접근 제어와 맞춤형 데이터 뷰는&lt;br /&gt;보안과 사용자 경험을 동시에 향상시키는 실무 필수 기능입니다.&lt;br /&gt;Power FX의 기본 함수와 데이터 소스 연동만으로&lt;br /&gt;강력한 권한 관리와 사용자별 맞춤 앱을 빠르게 구축할 수 있습니다.&lt;/p&gt;
&lt;p data-end=&quot;2089&quot; data-start=&quot;2019&quot; data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Programming/Power Apps(PowerFx)</category>
      <category>Filter</category>
      <category>Lookup</category>
      <category>powerapps</category>
      <category>powerfx</category>
      <category>user</category>
      <category>권한제어</category>
      <category>맞춤뷰</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/439</guid>
      <comments>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%A1%B0%EA%B1%B4%EB%B6%80-%EC%A0%91%EA%B7%BC-%EC%A0%9C%EC%96%B4%EC%99%80-%EC%82%AC%EC%9A%A9%EC%9E%90%EB%B3%84-%EB%A7%9E%EC%B6%A4-%EB%8D%B0%EC%9D%B4%ED%84%B0-%EB%B7%B0-%EA%B5%AC%ED%98%84#entry439comment</comments>
      <pubDate>Sat, 13 Sep 2025 16:19:41 +0900</pubDate>
    </item>
    <item>
      <title>⚡ Power FX 실전 &amp;mdash; 앱 내 일정 관리, 캘린더 및 일정 알림 구현법</title>
      <link>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%95%B1-%EB%82%B4-%EC%9D%BC%EC%A0%95-%EA%B4%80%EB%A6%AC-%EC%BA%98%EB%A6%B0%EB%8D%94-%EB%B0%8F-%EC%9D%BC%EC%A0%95-%EC%95%8C%EB%A6%BC-%EA%B5%AC%ED%98%84%EB%B2%95</link>
      <description>&lt;blockquote data-end=&quot;315&quot; data-start=&quot;141&quot; data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;이번 포스트에선 Power Apps에서 업무 일정, 회의 예약, 프로젝트 마감 등&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;캘린더(Calendar) 및 일정 관리 기능을 구현하는 실전 Power FX 활용법을 정리합니다.&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;예약, 할 일(To-Do), 마감일, 반복 일정 등 다양한 실무 시나리오에 바로 쓸 수 있는 코드와 팁을 담았습니다.&lt;/span&gt;&lt;/blockquote&gt;
&lt;hr data-end=&quot;320&quot; data-start=&quot;317&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;346&quot; data-start=&quot;322&quot; data-ke-size=&quot;size26&quot;&gt; ️ 일정(이벤트) 데이터 구조 설계&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;512&quot; data-start=&quot;348&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;368&quot; data-start=&quot;348&quot;&gt;&lt;b&gt;EventID&lt;/b&gt; : 고유번호&lt;/li&gt;
&lt;li data-end=&quot;388&quot; data-start=&quot;369&quot;&gt;&lt;b&gt;Title&lt;/b&gt; : 일정 제목&lt;/li&gt;
&lt;li data-end=&quot;425&quot; data-start=&quot;389&quot;&gt;&lt;b&gt;StartDateTime&lt;/b&gt; : 시작일시(DateTime)&lt;/li&gt;
&lt;li data-end=&quot;460&quot; data-start=&quot;426&quot;&gt;&lt;b&gt;EndDateTime&lt;/b&gt; : 종료일시(DateTime)&lt;/li&gt;
&lt;li data-end=&quot;486&quot; data-start=&quot;461&quot;&gt;&lt;b&gt;Description&lt;/b&gt; : 상세 설명&lt;/li&gt;
&lt;li data-end=&quot;512&quot; data-start=&quot;487&quot;&gt;&lt;b&gt;UserEmail&lt;/b&gt; : 담당자(선택)&lt;/li&gt;
&lt;/ul&gt;
&lt;p data-end=&quot;563&quot; data-start=&quot;514&quot; data-ke-size=&quot;size16&quot;&gt;데이터 소스는 SharePoint, Excel, Dataverse 등 자유롭게 사용 가능&lt;/p&gt;
&lt;hr data-end=&quot;568&quot; data-start=&quot;565&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;587&quot; data-start=&quot;570&quot; data-ke-size=&quot;size26&quot;&gt; ️ 일정 추가 및 표시&lt;/h2&gt;
&lt;h3 data-end=&quot;609&quot; data-start=&quot;589&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;일정 등록(추가)&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749017232534&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// btnAddEvent.OnSelect
Patch(
    CalendarEvents,
    Defaults(CalendarEvents),
    {
        Title: txtTitle.Text,
        StartDateTime: dtpStart.SelectedDate,
        EndDateTime: dtpEnd.SelectedDate,
        Description: txtDescription.Text,
        UserEmail: User().Email
    }
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1022&quot; data-start=&quot;912&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;944&quot; data-start=&quot;912&quot;&gt;&lt;b&gt;CalendarEvents&lt;/b&gt; : 일정 저장 테이블&lt;/li&gt;
&lt;li data-end=&quot;983&quot; data-start=&quot;945&quot;&gt;&lt;b&gt;txtTitle, txtDescription&lt;/b&gt; : 입력 필드&lt;/li&gt;
&lt;li data-end=&quot;1022&quot; data-start=&quot;984&quot;&gt;&lt;b&gt;dtpStart, dtpEnd&lt;/b&gt; : 시작/종료일 선택 컨트롤&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1027&quot; data-start=&quot;1024&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1064&quot; data-start=&quot;1029&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;캘린더에 오늘/이번주 일정만 필터링해서 보기&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749017320392&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// Gallery 또는 캘린더 뷰 Items
Filter(
    CalendarEvents,
    StartDateTime &amp;gt;= Today() &amp;amp;&amp;amp; StartDateTime &amp;lt; Today() + 7
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1213&quot; data-start=&quot;1196&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1213&quot; data-start=&quot;1196&quot;&gt;&lt;b&gt;이번주 일정만 필터링&lt;/b&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1218&quot; data-start=&quot;1215&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1255&quot; data-start=&quot;1220&quot; data-ke-size=&quot;size23&quot;&gt;3) &lt;b&gt;남은 D-Day(마감일까지 남은 일수) 표시&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749017332132&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// D-Day 라벨
&quot; D-&quot; &amp;amp; DateDiff(Today(), EndDateTime, Days)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1364&quot; data-start=&quot;1328&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1364&quot; data-start=&quot;1328&quot;&gt;마감이 가까울수록 색상/경고 아이콘 등 조건부 서식 추가 가능&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1369&quot; data-start=&quot;1366&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1391&quot; data-start=&quot;1371&quot; data-ke-size=&quot;size26&quot;&gt; ️ 일정 알림(자동, 수동)&lt;/h2&gt;
&lt;h3 data-end=&quot;1419&quot; data-start=&quot;1393&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;알림 필요 일정 조건부 노출&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749017341129&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 마감 임박(예: 3일 이내) 일정만 강조
If(
    EndDateTime &amp;lt;= Today() + 3 &amp;amp;&amp;amp; EndDateTime &amp;gt;= Today(),
    Color.Red,
    Color.Black
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;h3 data-end=&quot;1581&quot; data-start=&quot;1557&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;사용자 정의 알림 메시지&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749017346213&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 오늘 일정이 있을 때 팝업 알림
If(
    CountRows(Filter(CalendarEvents, StartDateTime = Today())) &amp;gt; 0,
    Notify(&quot;오늘 등록된 일정이 있습니다.&quot;, NotificationType.Information)
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;hr data-end=&quot;1757&quot; data-start=&quot;1754&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1771&quot; data-start=&quot;1759&quot; data-ke-size=&quot;size23&quot;&gt;함수/속성 설명&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1901&quot; data-start=&quot;1773&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1794&quot; data-start=&quot;1773&quot;&gt;&lt;b&gt;Patch&lt;/b&gt; : 새 일정 추가&lt;/li&gt;
&lt;li data-end=&quot;1822&quot; data-start=&quot;1795&quot;&gt;&lt;b&gt;Filter&lt;/b&gt; : 특정 날짜 범위만 표시&lt;/li&gt;
&lt;li data-end=&quot;1855&quot; data-start=&quot;1823&quot;&gt;&lt;b&gt;DateDiff&lt;/b&gt; : 남은 일수(D-Day) 계산&lt;/li&gt;
&lt;li data-end=&quot;1877&quot; data-start=&quot;1856&quot;&gt;&lt;b&gt;Today()&lt;/b&gt; : 오늘 날짜&lt;/li&gt;
&lt;li data-end=&quot;1901&quot; data-start=&quot;1878&quot;&gt;&lt;b&gt;Notify&lt;/b&gt; : 팝업 알림 표시&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1906&quot; data-start=&quot;1903&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1919&quot; data-start=&quot;1908&quot; data-ke-size=&quot;size26&quot;&gt;실무 활용 예시&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;2000&quot; data-start=&quot;1921&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1945&quot; data-start=&quot;1921&quot;&gt;사내 회의실 예약, 회의 일정 자동 관리&lt;/li&gt;
&lt;li data-end=&quot;1970&quot; data-start=&quot;1946&quot;&gt;프로젝트 마감 일정 추적 및 실시간 알림&lt;/li&gt;
&lt;li data-end=&quot;2000&quot; data-start=&quot;1971&quot;&gt;팀원별 할 일(To-Do), 반복/공유 일정 관리&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;2005&quot; data-start=&quot;2002&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;2014&quot; data-start=&quot;2007&quot; data-ke-size=&quot;size26&quot;&gt;실무 팁&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;2162&quot; data-start=&quot;2016&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;2074&quot; data-start=&quot;2016&quot;&gt;CalendarEvents 테이블엔 Start/EndDateTime, 담당자 등 필수 필드를 꼭 포함&lt;/li&gt;
&lt;li data-end=&quot;2123&quot; data-start=&quot;2075&quot;&gt;반복 일정, 예약 충돌 방지는 추가 로직(Patch 전에 중복 체크)으로 확장 가능&lt;/li&gt;
&lt;li data-end=&quot;2162&quot; data-start=&quot;2124&quot;&gt;일정 상세 페이지, 팝업 등으로 UX를 꾸미면 활용도가 높아집니다&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;2167&quot; data-start=&quot;2164&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;2175&quot; data-start=&quot;2169&quot; data-ke-size=&quot;size26&quot;&gt;마무리&lt;/h2&gt;
&lt;p data-end=&quot;2321&quot; data-start=&quot;2177&quot; data-ke-size=&quot;size16&quot;&gt;캘린더와 일정 관리 기능은&lt;br /&gt;거의 모든 실무 Power Apps 앱에 적용할 수 있는 핵심 유틸리티입니다.&lt;br /&gt;Power FX의 Patch, Filter, DateDiff, Notify 함수만 익혀도&lt;br /&gt;직접 일정을 추가/관리/알림까지 구현할 수 있습니다.&lt;/p&gt;
&lt;p data-end=&quot;2416&quot; data-start=&quot;2343&quot; data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Programming/Power Apps(PowerFx)</category>
      <category>datediff</category>
      <category>notify</category>
      <category>patch</category>
      <category>powerapps</category>
      <category>powerfx</category>
      <category>일정관리</category>
      <category>캘린더</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/438</guid>
      <comments>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%95%B1-%EB%82%B4-%EC%9D%BC%EC%A0%95-%EA%B4%80%EB%A6%AC-%EC%BA%98%EB%A6%B0%EB%8D%94-%EB%B0%8F-%EC%9D%BC%EC%A0%95-%EC%95%8C%EB%A6%BC-%EA%B5%AC%ED%98%84%EB%B2%95#entry438comment</comments>
      <pubDate>Tue, 9 Sep 2025 16:11:02 +0900</pubDate>
    </item>
    <item>
      <title>⚡ Power FX 실전 &amp;mdash; 오류 로깅 및 사용자 피드백 데이터 자동 수집</title>
      <link>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%98%A4%EB%A5%98-%EB%A1%9C%EA%B9%85-%EB%B0%8F-%EC%82%AC%EC%9A%A9%EC%9E%90-%ED%94%BC%EB%93%9C%EB%B0%B1-%EB%8D%B0%EC%9D%B4%ED%84%B0-%EC%9E%90%EB%8F%99-%EC%88%98%EC%A7%91</link>
      <description>&lt;blockquote data-end=&quot;196&quot; data-start=&quot;45&quot; data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;이번 포스트에선 Power Apps에서 사용자 오류, 예외 상황, 피드백 데이터를 자동으로 수집하고 기록하는 방법을 정리합니다.&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;앱이 배포된 후에도 실제 사용자 행동과 문제점을 실시간으로 파악할 수 있어,&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;지속적인 품질 개선과 빠른 이슈 대응에 매우 효과적입니다.&lt;/span&gt;&lt;/blockquote&gt;
&lt;hr data-end=&quot;201&quot; data-start=&quot;198&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;219&quot; data-start=&quot;203&quot; data-ke-size=&quot;size26&quot;&gt; ️ 오류 로깅 자동화&lt;/h2&gt;
&lt;h3 data-end=&quot;257&quot; data-start=&quot;221&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;오류 발생 시 로그 데이터 테이블에 자동 저장&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749016799330&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 예: 저장 실패 시 오류 내용 로그 기록
If(
    IsBlank(TextInput1.Text),
    Patch(
        ErrorLogs,
        Defaults(ErrorLogs),
        {
            UserEmail: User().Email,
            ErrorMsg: &quot;필수 입력값 누락&quot;,
            ErrorTime: Now()
        }
    );
    Notify(&quot;필수 값을 입력하세요.&quot;, NotificationType.Error)
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;722&quot; data-start=&quot;573&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;640&quot; data-start=&quot;573&quot;&gt;&lt;b&gt;ErrorLogs&lt;/b&gt; : 오류 로그 기록용 데이터 테이블(SharePoint, Dataverse, Excel 등)&lt;/li&gt;
&lt;li data-end=&quot;674&quot; data-start=&quot;641&quot;&gt;&lt;b&gt;Patch&lt;/b&gt; : 새 오류 로그를 데이터 소스에 추가&lt;/li&gt;
&lt;li data-end=&quot;722&quot; data-start=&quot;675&quot;&gt;&lt;b&gt;User().Email, Now()&lt;/b&gt; : 오류 발생 시점과 사용자 정보 기록&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;727&quot; data-start=&quot;724&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;761&quot; data-start=&quot;729&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;앱 전역에서 공통 오류 기록 함수 활용&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749016815350&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 오류 기록용 사용자 정의 함수(App &amp;gt; Components 등)
SetErrorLog(ErrorMsg) =
    Patch(
        ErrorLogs,
        Defaults(ErrorLogs),
        {
            UserEmail: User().Email,
            ErrorMsg: ErrorMsg,
            ErrorTime: Now()
        }
    )&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1061&quot; data-start=&quot;1024&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1061&quot; data-start=&quot;1024&quot;&gt;&lt;b&gt;필요할 때마다 SetErrorLog(&quot;에러 내용&quot;) 호출&lt;/b&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1066&quot; data-start=&quot;1063&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1088&quot; data-start=&quot;1068&quot; data-ke-size=&quot;size26&quot;&gt; ️ 사용자 피드백 자동 수집&lt;/h2&gt;
&lt;h3 data-end=&quot;1119&quot; data-start=&quot;1090&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;사용자 평가/피드백 입력 폼 제공&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1186&quot; data-start=&quot;1120&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1149&quot; data-start=&quot;1120&quot;&gt;앱 하단/설정 메뉴에 &amp;lsquo;피드백 남기기&amp;rsquo; 버튼 배치&lt;/li&gt;
&lt;li data-end=&quot;1186&quot; data-start=&quot;1150&quot;&gt;TextInput, Dropdown 등으로 평가/의견 입력받기&lt;/li&gt;
&lt;/ul&gt;
&lt;h3 data-end=&quot;1211&quot; data-start=&quot;1188&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;피드백 저장 코드 예시&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749016821959&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// btnSubmitFeedback.OnSelect
Patch(
    Feedbacks,
    Defaults(Feedbacks),
    {
        UserEmail: User().Email,
        FeedbackText: txtFeedback.Text,
        FeedbackTime: Now(),
        FeedbackType: ddFeedbackType.Selected.Value
    }
);
Notify(&quot;소중한 의견이 저장되었습니다.&quot;, NotificationType.Success)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1638&quot; data-start=&quot;1526&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1558&quot; data-start=&quot;1526&quot;&gt;&lt;b&gt;Feedbacks&lt;/b&gt; : 피드백 기록 데이터 테이블&lt;/li&gt;
&lt;li data-end=&quot;1586&quot; data-start=&quot;1559&quot;&gt;&lt;b&gt;txtFeedback&lt;/b&gt; : 피드백 입력란&lt;/li&gt;
&lt;li data-end=&quot;1638&quot; data-start=&quot;1587&quot;&gt;&lt;b&gt;ddFeedbackType&lt;/b&gt; : 피드백 종류 선택(예: 개선사항, 버그, 칭찬 등)&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1643&quot; data-start=&quot;1640&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1657&quot; data-start=&quot;1645&quot; data-ke-size=&quot;size23&quot;&gt;함수/속성 설명&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1795&quot; data-start=&quot;1659&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1717&quot; data-start=&quot;1659&quot;&gt;&lt;b&gt;Patch(테이블, Defaults(테이블), {필드:값})&lt;/b&gt; : 새 레코드(오류/피드백) 추가&lt;/li&gt;
&lt;li data-end=&quot;1758&quot; data-start=&quot;1718&quot;&gt;&lt;b&gt;User().Email, Now()&lt;/b&gt; : 사용자/시간 자동 기록&lt;/li&gt;
&lt;li data-end=&quot;1795&quot; data-start=&quot;1759&quot;&gt;&lt;b&gt;Notify(메시지, 타입)&lt;/b&gt; : 저장 결과 실시간 안내&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1800&quot; data-start=&quot;1797&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1813&quot; data-start=&quot;1802&quot; data-ke-size=&quot;size26&quot;&gt;실무 활용 예시&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1929&quot; data-start=&quot;1815&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1850&quot; data-start=&quot;1815&quot;&gt;예상치 못한 입력 오류, 저장 실패 등 사용자 경험 모니터링&lt;/li&gt;
&lt;li data-end=&quot;1890&quot; data-start=&quot;1851&quot;&gt;버그, 개선 요청 등 앱 내부 피드백의 정량/정성 데이터 자동 수집&lt;/li&gt;
&lt;li data-end=&quot;1929&quot; data-start=&quot;1891&quot;&gt;정기적으로 로그/피드백 테이블 점검 &amp;rarr; 앱 개선/QA 보고서 작성&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1934&quot; data-start=&quot;1931&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1943&quot; data-start=&quot;1936&quot; data-ke-size=&quot;size26&quot;&gt;실무 팁&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;2113&quot; data-start=&quot;1945&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;2012&quot; data-start=&quot;1945&quot;&gt;ErrorLogs/Feedbacks 테이블은 최소한 UserEmail, 날짜/시간, 상세 내용 필드를 꼭 포함하세요.&lt;/li&gt;
&lt;li data-end=&quot;2047&quot; data-start=&quot;2013&quot;&gt;사용자 개인정보 보호와 보안 정책을 사내 기준에 맞게 설정&lt;/li&gt;
&lt;li data-end=&quot;2113&quot; data-start=&quot;2048&quot;&gt;수집된 로그와 피드백 데이터는 Power BI 등으로 대시보드화하면&lt;br /&gt;운영팀/기획자와 실시간 공유가 가능합니다.&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;2118&quot; data-start=&quot;2115&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;2126&quot; data-start=&quot;2120&quot; data-ke-size=&quot;size26&quot;&gt;마무리&lt;/h2&gt;
&lt;p data-end=&quot;2260&quot; data-start=&quot;2128&quot; data-ke-size=&quot;size16&quot;&gt;오류 로깅과 피드백 자동 수집 기능을 넣어두면&lt;br /&gt;배포 후에도 사용자 문제를 빠르게 확인&amp;middot;개선할 수 있습니다.&lt;br /&gt;Power FX의 Patch, User, Now 등 기본 함수만으로도&lt;br /&gt;효과적인 앱 품질 관리 체계를 만들 수 있습니다.&lt;/p&gt;
&lt;p data-end=&quot;2354&quot; data-start=&quot;2282&quot; data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Programming/Power Apps(PowerFx)</category>
      <category>errorlogs</category>
      <category>patch</category>
      <category>powerapps</category>
      <category>powerfx</category>
      <category>오류로깅</category>
      <category>피드백</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/437</guid>
      <comments>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%98%A4%EB%A5%98-%EB%A1%9C%EA%B9%85-%EB%B0%8F-%EC%82%AC%EC%9A%A9%EC%9E%90-%ED%94%BC%EB%93%9C%EB%B0%B1-%EB%8D%B0%EC%9D%B4%ED%84%B0-%EC%9E%90%EB%8F%99-%EC%88%98%EC%A7%91#entry437comment</comments>
      <pubDate>Fri, 5 Sep 2025 16:02:00 +0900</pubDate>
    </item>
    <item>
      <title>⚡ Power FX 실전 &amp;mdash; 알림, 팝업, 인터랙션으로 사용자 경험(UX) 개선하기</title>
      <link>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%95%8C%EB%A6%BC-%ED%8C%9D%EC%97%85-%EC%9D%B8%ED%84%B0%EB%9E%99%EC%85%98%EC%9C%BC%EB%A1%9C-%EC%82%AC%EC%9A%A9%EC%9E%90-%EA%B2%BD%ED%97%98UX-%EA%B0%9C%EC%84%A0%ED%95%98%EA%B8%B0</link>
      <description>&lt;blockquote data-end=&quot;206&quot; data-start=&quot;50&quot; data-ke-style=&quot;style1&quot;&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;이번 포스트에선 Power Apps에서 사용자 경험(UX)을 한 단계 높여주는&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;알림(Notify), 팝업(Modal), 인터랙션(애니메이션/상태 전환 등) 구현 방법을 정리합니다.&lt;/span&gt;&lt;br /&gt;&lt;span style=&quot;font-family: 'Noto Serif KR';&quot;&gt;작지만 확실한 변화로, 사용자가 앱을 더 직관적이고 재미있게 사용할 수 있도록 만들어보세요.&lt;/span&gt;&lt;/blockquote&gt;
&lt;hr data-end=&quot;211&quot; data-start=&quot;208&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;237&quot; data-start=&quot;213&quot; data-ke-size=&quot;size26&quot;&gt; ️ 실시간 알림(Notify) 활용&lt;/h2&gt;
&lt;h3 data-end=&quot;269&quot; data-start=&quot;239&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;저장/삭제/오류 등 작업 결과 안내&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749016572179&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 저장 버튼 OnSelect
If(
    !IsBlank(TextInput1.Text),
    Notify(&quot;저장 완료!&quot;, NotificationType.Success),
    Notify(&quot;필수 값을 입력하세요.&quot;, NotificationType.Error)
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;499&quot; data-start=&quot;439&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;499&quot; data-start=&quot;439&quot;&gt;&lt;b&gt;Notify(메시지, 타입)&lt;/b&gt; : 앱 화면 상단에 Success/Error/Info 등 메시지 팝업&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;504&quot; data-start=&quot;501&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;529&quot; data-start=&quot;506&quot; data-ke-size=&quot;size26&quot;&gt; ️ 팝업(Modal) 창 구현하기&lt;/h2&gt;
&lt;h3 data-end=&quot;560&quot; data-start=&quot;531&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;팝업 노출/숨김 제어용 로컬 변수&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749016584757&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// 팝업 열기 버튼 OnSelect
UpdateContext({showPopup: true})

// 팝업 닫기 버튼 OnSelect
UpdateContext({showPopup: false})

// 팝업 카드(컨테이너)의 Visible 속성
showPopup&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;753&quot; data-start=&quot;724&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;753&quot; data-start=&quot;724&quot;&gt;&lt;b&gt;showPopup&lt;/b&gt; : 팝업 표시 여부 제어&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;758&quot; data-start=&quot;755&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;799&quot; data-start=&quot;760&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;팝업 안에 안내문구, 확인/취소 버튼 등 자유 배치&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;878&quot; data-start=&quot;800&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;844&quot; data-start=&quot;800&quot;&gt;사용자가 중요한 결정(삭제, 전송 등) 전 재확인하게 만들면 오류 방지 효과&lt;/li&gt;
&lt;li data-end=&quot;878&quot; data-start=&quot;845&quot;&gt;팝업 내 Notify로 안내 메시지를 함께 띄워도 효과적&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;883&quot; data-start=&quot;880&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;912&quot; data-start=&quot;885&quot; data-ke-size=&quot;size26&quot;&gt; ️ 버튼, 아이콘 등 인터랙션 효과 적용&lt;/h2&gt;
&lt;h3 data-end=&quot;955&quot; data-start=&quot;914&quot; data-ke-size=&quot;size23&quot;&gt;1) &lt;b&gt;Hover, Pressed 등 상태별 색상/아이콘 변경&lt;/b&gt;&lt;/h3&gt;
&lt;div&gt;
&lt;div&gt;
&lt;pre id=&quot;code_1749016592956&quot; class=&quot;python&quot; data-ke-language=&quot;python&quot; data-ke-type=&quot;codeblock&quot;&gt;&lt;code&gt;// Button.Fill
If(
    Self.Pressed,
    Color.LightGray,
    If(
        Self.Hover,
        Color.SkyBlue,
        Color.White
    )
)&lt;/code&gt;&lt;/pre&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1161&quot; data-start=&quot;1108&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1161&quot; data-start=&quot;1108&quot;&gt;&lt;b&gt;Self.Pressed, Self.Hover&lt;/b&gt; : 버튼의 현재 상태(눌림/마우스 오버)&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1166&quot; data-start=&quot;1163&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h3 data-end=&quot;1197&quot; data-start=&quot;1168&quot; data-ke-size=&quot;size23&quot;&gt;2) &lt;b&gt;상태 전환에 애니메이션 느낌 주기&lt;/b&gt;&lt;/h3&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1309&quot; data-start=&quot;1198&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1250&quot; data-start=&quot;1198&quot;&gt;슬라이더, ProgressBar 등 Value 변동에 따라 색상/길이/배경색 동적으로 변경&lt;/li&gt;
&lt;li data-end=&quot;1309&quot; data-start=&quot;1251&quot;&gt;여러 상태(State)에 따라 Visible/Color/Fill 등을 조합해 자연스러운 인터랙션 가능&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1314&quot; data-start=&quot;1311&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1327&quot; data-start=&quot;1316&quot; data-ke-size=&quot;size26&quot;&gt;실무 활용 예시&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1464&quot; data-start=&quot;1329&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1369&quot; data-start=&quot;1329&quot;&gt;저장&amp;middot;삭제 등 주요 작업 완료 시 Success/Error 알림 제공&lt;/li&gt;
&lt;li data-end=&quot;1411&quot; data-start=&quot;1370&quot;&gt;위험 작업(삭제 등)에는 팝업 재확인(Modal)으로 사용자 실수 방지&lt;/li&gt;
&lt;li data-end=&quot;1464&quot; data-start=&quot;1412&quot;&gt;버튼, 아이콘, 리스트 항목 등에 Hover/Pressed 상태별 컬러 변화로 클릭감 전달&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1469&quot; data-start=&quot;1466&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1478&quot; data-start=&quot;1471&quot; data-ke-size=&quot;size26&quot;&gt;실무 팁&lt;/h2&gt;
&lt;ul style=&quot;list-style-type: disc;&quot; data-end=&quot;1648&quot; data-start=&quot;1480&quot; data-ke-list-type=&quot;disc&quot;&gt;
&lt;li data-end=&quot;1557&quot; data-start=&quot;1480&quot;&gt;팝업 구현 시 화면 전체를 덮는 반투명 Rectangle + 카드 레이아웃 사용&lt;br /&gt;(화면 터치 시 팝업 닫기 기능도 함께 구현 가능)&lt;/li&gt;
&lt;li data-end=&quot;1607&quot; data-start=&quot;1558&quot;&gt;Notify는 짧고 명확한 메시지 사용, Success/Error/Info 색상 구분&lt;/li&gt;
&lt;li data-end=&quot;1648&quot; data-start=&quot;1608&quot;&gt;작은 인터랙션 효과도 꾸준히 추가하면 앱이 한층 &amp;ldquo;앱답게&amp;rdquo; 느껴집니다&lt;/li&gt;
&lt;/ul&gt;
&lt;hr data-end=&quot;1653&quot; data-start=&quot;1650&quot; data-ke-style=&quot;style1&quot; /&gt;
&lt;h2 data-end=&quot;1661&quot; data-start=&quot;1655&quot; data-ke-size=&quot;size26&quot;&gt;마무리&lt;/h2&gt;
&lt;p data-end=&quot;1790&quot; data-start=&quot;1663&quot; data-ke-size=&quot;size16&quot;&gt;알림, 팝업, 인터랙션 효과는&lt;br /&gt;단순한 데이터 입력 앱을 사용자 친화적이고 세련된 앱으로 업그레이드하는 핵심 요소입니다.&lt;br /&gt;Power FX의 기본 함수와 컨트롤 속성만 잘 활용해도&lt;br /&gt;누구나 쉽게 UX를 개선할 수 있습니다.&lt;/p&gt;
&lt;p data-end=&quot;1875&quot; data-start=&quot;1812&quot; data-ke-size=&quot;size16&quot;&gt;&amp;nbsp;&lt;/p&gt;</description>
      <category>Programming/Power Apps(PowerFx)</category>
      <category>powerapps</category>
      <category>powerfx</category>
      <category>알림</category>
      <category>인터랙션</category>
      <category>팝업</category>
      <author>Allen93</author>
      <guid isPermaLink="true">https://allensdatablog.tistory.com/436</guid>
      <comments>https://allensdatablog.tistory.com/entry/%E2%9A%A1-Power-FX-%EC%8B%A4%EC%A0%84-%E2%80%94-%EC%95%8C%EB%A6%BC-%ED%8C%9D%EC%97%85-%EC%9D%B8%ED%84%B0%EB%9E%99%EC%85%98%EC%9C%BC%EB%A1%9C-%EC%82%AC%EC%9A%A9%EC%9E%90-%EA%B2%BD%ED%97%98UX-%EA%B0%9C%EC%84%A0%ED%95%98%EA%B8%B0#entry436comment</comments>
      <pubDate>Mon, 1 Sep 2025 15:56:55 +0900</pubDate>
    </item>
  </channel>
</rss>