{"id":3538,"date":"2025-06-28T07:59:39","date_gmt":"2025-06-27T23:59:39","guid":{"rendered":"http:\/\/viplao.com\/?p=3538"},"modified":"2025-06-28T13:39:27","modified_gmt":"2025-06-28T05:39:27","slug":"%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3","status":"publish","type":"post","link":"http:\/\/viplao.com\/index.php\/2025\/06\/28\/%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3\/","title":{"rendered":"\u3010Python10\u5e74\u7ecf\u9a8c\u603b\u7ed3\u3011\u7b2c\u4e09\u8bfe \u7535\u5546\u5e73\u53f0\u9500\u552e\u6570\u636e\u5206\u6790\u5b9e\u8df5\u5206\u89e3 \u2013 \u6570\u636e\u8f6c\u6362\uff08Data Transformation\uff09"},"content":{"rendered":"\n<p>\u5e38\u7528\u7684\u6570\u636e\u8f6c\u6362\u5206\u7c7b\uff1a<\/p>\n\n\n\n<ol>\n<li>\u63d0\u53d6\u65e5\u671f\u4e2d\u7684\u5e74\u3001\u6708\u3001\u5468\u3001\u661f\u671f\u51e0<\/li>\n\n\n\n<li>\u5c06\u5b57\u7b26\u4e32\u5206\u7c7b\u53d8\u91cf\u7f16\u7801\u4e3a\u54d1\u53d8\u91cf\uff08One-Hot Encoding\uff09<\/li>\n\n\n\n<li>\u8ba1\u7b97\u8ba2\u5355\u603b\u91d1\u989d\uff08\u5355\u4ef7\u00d7\u6570\u91cf\uff09<\/li>\n\n\n\n<li>\u8ba1\u7b97\u6298\u6263\u7387\uff08\u5b9e\u9645\u652f\u4ed8\u4ef7 \/ 
\u539f\u4ef7\uff09<\/li>\n\n\n\n<li>\u6784\u9020\u7528\u6237\u8d2d\u4e70\u9891\u6b21\u7279\u5f81<\/li>\n\n\n\n<li>\u8f6c\u6362\u65f6\u95f4\u6233\u4e3a\u53ef\u6392\u5e8f\u7684\u65f6\u95f4\u5e8f\u5217<\/li>\n\n\n\n<li>\u6784\u9020\u5546\u54c1\u9500\u91cf\u6392\u540d\u5b57\u6bb5<\/li>\n\n\n\n<li>\u5408\u5e76\u591a\u4e2a\u6570\u636e\u6e90\u751f\u6210\u5bbd\u8868<\/li>\n\n\n\n<li>\u5bf9\u4ef7\u683c\u8fdb\u884c\u6807\u51c6\u5316\uff08Z-score\uff09<\/li>\n\n\n\n<li>\u6784\u9020\u662f\u5426\u53c2\u4e0e\u4fc3\u9500\u7684\u5e03\u5c14\u6807\u7b7e<\/li>\n<\/ol>\n\n\n\n<p>\u6211\u4eec\u5c06\u5c55\u793a\u5982\u4f55\u8fdb\u884c\u8fd9\u4e9b\u5e38\u89c1\u7684\u6570\u636e\u8f6c\u6362\u4efb\u52a1\u3002\u5047\u8bbe\u6211\u4eec\u6709\u4e00\u4e2a\u5305\u542b\u9500\u552e\u8ba2\u5355\u6570\u636e\u7684DataFrame\uff0c\u5e76\u9010\u6b65\u5e94\u7528\u8fd9\u4e9b\u8f6c\u6362\u64cd\u4f5c\u3002<\/p>\n\n\n\n<p>\u9996\u5148\uff0c\u8ba9\u6211\u4eec\u521b\u5efa\u4e00\u4e2a\u793a\u4f8bDataFrame\u6765\u6a21\u62df\u539f\u59cb\u6570\u636e\uff1a<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>import pandas as pd\nimport numpy as np\n\n# \u521b\u5efa\u793a\u4f8bDataFrame\ndata = {\n    'order_id': &#91;1, 2, 3, 4, 5, 6, 7, 8],\n    'product_id': &#91;'A001', 'B002', 'D004', 'E005', 'F006', 'G007', 'H008', 'I009'],\n    'category_code': &#91;'C1', 'C2', 'C1', 'C3', 'C4', 'C5', 'C6', 'C7'],\n    'amount': &#91;100.00, 200.00, 300.00, 400.00, 500.00, 600.00, 700.00, 800.00],\n    'original_price': &#91;120.00, 220.00, 320.00, 420.00, 520.00, 620.00, 720.00, 820.00],\n    'quantity': &#91;1, 2, 1, 1, 2, 1, 1, 2],\n    'order_date': &#91;'2025-06-01', '2025-06-02', '2025-06-03', '2025-06-04', '2025-06-05', '2025-06-06', '2025-06-07', '2025-06-08'],\n    'customer_id': &#91;101, 102, 103, 104, 105, 106, 107, 108],\n    'promotion': &#91;False, True, False, True, False, True, False, True]\n}\n\ndf = 
pd.DataFrame(data)\nprint(\"\u539f\u59cb\u6570\u636e:\")\nprint(df)<\/code><\/pre>\n\n\n\n<p>\u63a5\u4e0b\u6765\uff0c\u6211\u4eec\u5c06\u9010\u4e2a\u5904\u7406\u4e0a\u8ff0\u63d0\u5230\u7684\u6570\u636e\u8f6c\u6362\u4efb\u52a1\u3002<\/p>\n\n\n\n<div id=\"ez-toc-container\" class=\"ez-toc-v2_0_71 counter-hierarchy ez-toc-counter ez-toc-grey ez-toc-container-direction\">\n<div class=\"ez-toc-title-container\">\n<p class=\"ez-toc-title\" style=\"cursor:inherit\">\u6587\u7ae0\u76ee\u5f55<\/p>\n<span class=\"ez-toc-title-toggle\"><a href=\"#\" class=\"ez-toc-pull-right ez-toc-btn ez-toc-btn-xs ez-toc-btn-default ez-toc-toggle\" aria-label=\"Toggle Table of Content\"><span class=\"ez-toc-js-icon-con\"><span class=\"\"><span class=\"eztoc-hide\" style=\"display:none;\">Toggle<\/span><span class=\"ez-toc-icon-toggle-span\"><svg style=\"fill: #999;color:#999\" xmlns=\"http:\/\/www.w3.org\/2000\/svg\" class=\"list-377408\" width=\"20px\" height=\"20px\" viewBox=\"0 0 24 24\" fill=\"none\"><path d=\"M6 6H4v2h2V6zm14 0H8v2h12V6zM4 11h2v2H4v-2zm16 0H8v2h12v-2zM4 16h2v2H4v-2zm16 0H8v2h12v-2z\" fill=\"currentColor\"><\/path><\/svg><svg style=\"fill: #999;color:#999\" class=\"arrow-unsorted-368013\" xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"10px\" height=\"10px\" viewBox=\"0 0 24 24\" version=\"1.2\" baseProfile=\"tiny\"><path d=\"M18.2 9.3l-6.2-6.3-6.2 6.3c-.2.2-.3.4-.3.7s.1.5.3.7c.2.2.4.3.7.3h11c.3 0 .5-.1.7-.3.2-.2.3-.5.3-.7s-.1-.5-.3-.7zM5.8 14.7l6.2 6.3 6.2-6.3c.2-.2.3-.5.3-.7s-.1-.5-.3-.7c-.2-.2-.4-.3-.7-.3h-11c-.3 0-.5.1-.7.3-.2.2-.3.5-.3.7s.1.5.3.7z\"\/><\/svg><\/span><\/span><\/span><\/a><\/span><\/div>\n<nav><ul class='ez-toc-list ez-toc-list-level-1 eztoc-toggle-hide-by-default' ><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-1\" 
href=\"http:\/\/viplao.com\/index.php\/2025\/06\/28\/%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3\/#1_%E6%8F%90%E5%8F%96%E6%97%A5%E6%9C%9F%E4%B8%AD%E7%9A%84%E5%B9%B4%E3%80%81%E6%9C%88%E3%80%81%E5%91%A8%E3%80%81%E6%98%9F%E6%9C%9F%E5%87%A0\" title=\"1. \u63d0\u53d6\u65e5\u671f\u4e2d\u7684\u5e74\u3001\u6708\u3001\u5468\u3001\u661f\u671f\u51e0\">1. \u63d0\u53d6\u65e5\u671f\u4e2d\u7684\u5e74\u3001\u6708\u3001\u5468\u3001\u661f\u671f\u51e0<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-2\" href=\"http:\/\/viplao.com\/index.php\/2025\/06\/28\/%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3\/#2_%E5%B0%86%E5%AD%97%E7%AC%A6%E4%B8%B2%E5%88%86%E7%B1%BB%E5%8F%98%E9%87%8F%E7%BC%96%E7%A0%81%E4%B8%BA%E5%93%91%E5%8F%98%E9%87%8F%EF%BC%88One-Hot_Encoding%EF%BC%89\" title=\"2. \u5c06\u5b57\u7b26\u4e32\u5206\u7c7b\u53d8\u91cf\u7f16\u7801\u4e3a\u54d1\u53d8\u91cf\uff08One-Hot Encoding\uff09\">2. \u5c06\u5b57\u7b26\u4e32\u5206\u7c7b\u53d8\u91cf\u7f16\u7801\u4e3a\u54d1\u53d8\u91cf\uff08One-Hot Encoding\uff09<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-3\" href=\"http:\/\/viplao.com\/index.php\/2025\/06\/28\/%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3\/#3_%E8%AE%A1%E7%AE%97%E8%AE%A2%E5%8D%95%E6%80%BB%E9%87%91%E9%A2%9D%EF%BC%88%E5%8D%95%E4%BB%B7%C3%97%E6%95%B0%E9%87%8F%EF%BC%89\" title=\"3. \u8ba1\u7b97\u8ba2\u5355\u603b\u91d1\u989d\uff08\u5355\u4ef7\u00d7\u6570\u91cf\uff09\">3. 
\u8ba1\u7b97\u8ba2\u5355\u603b\u91d1\u989d\uff08\u5355\u4ef7\u00d7\u6570\u91cf\uff09<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-4\" href=\"http:\/\/viplao.com\/index.php\/2025\/06\/28\/%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3\/#4_%E8%AE%A1%E7%AE%97%E6%8A%98%E6%89%A3%E7%8E%87%EF%BC%88%E5%AE%9E%E9%99%85%E6%94%AF%E4%BB%98%E4%BB%B7_%E5%8E%9F%E4%BB%B7%EF%BC%89\" title=\"4. \u8ba1\u7b97\u6298\u6263\u7387\uff08\u5b9e\u9645\u652f\u4ed8\u4ef7 \/ \u539f\u4ef7\uff09\">4. \u8ba1\u7b97\u6298\u6263\u7387\uff08\u5b9e\u9645\u652f\u4ed8\u4ef7 \/ \u539f\u4ef7\uff09<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-5\" href=\"http:\/\/viplao.com\/index.php\/2025\/06\/28\/%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3\/#5_%E6%9E%84%E9%80%A0%E7%94%A8%E6%88%B7%E8%B4%AD%E4%B9%B0%E9%A2%91%E6%AC%A1%E7%89%B9%E5%BE%81\" title=\"5. \u6784\u9020\u7528\u6237\u8d2d\u4e70\u9891\u6b21\u7279\u5f81\">5. \u6784\u9020\u7528\u6237\u8d2d\u4e70\u9891\u6b21\u7279\u5f81<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-6\" href=\"http:\/\/viplao.com\/index.php\/2025\/06\/28\/%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3\/#6_%E8%BD%AC%E6%8D%A2%E6%97%B6%E9%97%B4%E6%88%B3%E4%B8%BA%E5%8F%AF%E6%8E%92%E5%BA%8F%E7%9A%84%E6%97%B6%E9%97%B4%E5%BA%8F%E5%88%97\" title=\"6. \u8f6c\u6362\u65f6\u95f4\u6233\u4e3a\u53ef\u6392\u5e8f\u7684\u65f6\u95f4\u5e8f\u5217\">6. 
\u8f6c\u6362\u65f6\u95f4\u6233\u4e3a\u53ef\u6392\u5e8f\u7684\u65f6\u95f4\u5e8f\u5217<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-7\" href=\"http:\/\/viplao.com\/index.php\/2025\/06\/28\/%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3\/#7_%E6%9E%84%E9%80%A0%E5%95%86%E5%93%81%E9%94%80%E9%87%8F%E6%8E%92%E5%90%8D%E5%AD%97%E6%AE%B5\" title=\"7. \u6784\u9020\u5546\u54c1\u9500\u91cf\u6392\u540d\u5b57\u6bb5\">7. \u6784\u9020\u5546\u54c1\u9500\u91cf\u6392\u540d\u5b57\u6bb5<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-8\" href=\"http:\/\/viplao.com\/index.php\/2025\/06\/28\/%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3\/#8_%E5%AF%B9%E4%BB%B7%E6%A0%BC%E8%BF%9B%E8%A1%8C%E6%A0%87%E5%87%86%E5%8C%96%EF%BC%88Z-score%EF%BC%89\" title=\"8. \u5bf9\u4ef7\u683c\u8fdb\u884c\u6807\u51c6\u5316\uff08Z-score\uff09\">8. \u5bf9\u4ef7\u683c\u8fdb\u884c\u6807\u51c6\u5316\uff08Z-score\uff09<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-9\" href=\"http:\/\/viplao.com\/index.php\/2025\/06\/28\/%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3\/#9_%E6%9E%84%E9%80%A0%E6%98%AF%E5%90%A6%E5%8F%82%E4%B8%8E%E4%BF%83%E9%94%80%E7%9A%84%E5%B8%83%E5%B0%94%E6%A0%87%E7%AD%BE\" title=\"9. \u6784\u9020\u662f\u5426\u53c2\u4e0e\u4fc3\u9500\u7684\u5e03\u5c14\u6807\u7b7e\">9. 
\u6784\u9020\u662f\u5426\u53c2\u4e0e\u4fc3\u9500\u7684\u5e03\u5c14\u6807\u7b7e<\/a><\/li><\/ul><\/nav><\/div>\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"1_%E6%8F%90%E5%8F%96%E6%97%A5%E6%9C%9F%E4%B8%AD%E7%9A%84%E5%B9%B4%E3%80%81%E6%9C%88%E3%80%81%E5%91%A8%E3%80%81%E6%98%9F%E6%9C%9F%E5%87%A0\"><\/span>1. \u63d0\u53d6\u65e5\u671f\u4e2d\u7684\u5e74\u3001\u6708\u3001\u5468\u3001\u661f\u671f\u51e0<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<pre class=\"wp-block-code\"><code># \u8f6c\u6362order_date\u4e3a\u65e5\u671f\u683c\u5f0f\ndf&#91;'order_date'] = pd.to_datetime(df&#91;'order_date'])\n\n# \u63d0\u53d6\u5e74\u3001\u6708\u3001\u5468\u3001\u661f\u671f\u51e0\ndf&#91;'year'] = df&#91;'order_date'].dt.year\ndf&#91;'month'] = df&#91;'order_date'].dt.month\ndf&#91;'week_of_year'] = df&#91;'order_date'].dt.isocalendar().week.astype(int)\ndf&#91;'day_of_week'] = df&#91;'order_date'].dt.dayofweek\n\nprint(\"\\n\u63d0\u53d6\u65e5\u671f\u4e2d\u7684\u5e74\u3001\u6708\u3001\u5468\u3001\u661f\u671f\u51e0\u540e:\")\nprint(df)<\/code><\/pre>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"2_%E5%B0%86%E5%AD%97%E7%AC%A6%E4%B8%B2%E5%88%86%E7%B1%BB%E5%8F%98%E9%87%8F%E7%BC%96%E7%A0%81%E4%B8%BA%E5%93%91%E5%8F%98%E9%87%8F%EF%BC%88One-Hot_Encoding%EF%BC%89\"><\/span>2. 
\u5c06\u5b57\u7b26\u4e32\u5206\u7c7b\u53d8\u91cf\u7f16\u7801\u4e3a\u54d1\u53d8\u91cf\uff08One-Hot Encoding\uff09<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<pre class=\"wp-block-code\"><code># \u5c06category_code\u8fdb\u884cone-hot encoding\ndf_encoded = pd.get_dummies(df, columns=&#91;'category_code'], prefix='cat')\n\nprint(\"\\n\u5c06\u5b57\u7b26\u4e32\u5206\u7c7b\u53d8\u91cf\u7f16\u7801\u4e3a\u54d1\u53d8\u91cf\u540e:\")\nprint(df_encoded)<\/code><\/pre>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"3_%E8%AE%A1%E7%AE%97%E8%AE%A2%E5%8D%95%E6%80%BB%E9%87%91%E9%A2%9D%EF%BC%88%E5%8D%95%E4%BB%B7%C3%97%E6%95%B0%E9%87%8F%EF%BC%89\"><\/span>3. \u8ba1\u7b97\u8ba2\u5355\u603b\u91d1\u989d\uff08\u5355\u4ef7\u00d7\u6570\u91cf\uff09<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<pre class=\"wp-block-code\"><code># \u8ba1\u7b97\u8ba2\u5355\u603b\u91d1\u989d\ndf_encoded&#91;'total_amount'] = df_encoded&#91;'amount'] * df_encoded&#91;'quantity']\n\nprint(\"\\n\u8ba1\u7b97\u8ba2\u5355\u603b\u91d1\u989d\u540e:\")\nprint(df_encoded)<\/code><\/pre>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"4_%E8%AE%A1%E7%AE%97%E6%8A%98%E6%89%A3%E7%8E%87%EF%BC%88%E5%AE%9E%E9%99%85%E6%94%AF%E4%BB%98%E4%BB%B7_%E5%8E%9F%E4%BB%B7%EF%BC%89\"><\/span>4. \u8ba1\u7b97\u6298\u6263\u7387\uff08\u5b9e\u9645\u652f\u4ed8\u4ef7 \/ \u539f\u4ef7\uff09<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<pre class=\"wp-block-code\"><code># \u8ba1\u7b97\u6298\u6263\u7387\ndf_encoded&#91;'discount_rate'] = (df_encoded&#91;'amount'] \/ df_encoded&#91;'original_price']).round(2)\n\nprint(\"\\n\u8ba1\u7b97\u6298\u6263\u7387\u540e:\")\nprint(df_encoded)<\/code><\/pre>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"5_%E6%9E%84%E9%80%A0%E7%94%A8%E6%88%B7%E8%B4%AD%E4%B9%B0%E9%A2%91%E6%AC%A1%E7%89%B9%E5%BE%81\"><\/span>5. 
\u6784\u9020\u7528\u6237\u8d2d\u4e70\u9891\u6b21\u7279\u5f81<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<p>\u5047\u8bbe\u6211\u4eec\u6709\u4e00\u4e2a\u5ba2\u6237\u8d2d\u4e70\u8bb0\u5f55\u7684DataFrame\uff0c\u7528\u4e8e\u6784\u9020\u7528\u6237\u8d2d\u4e70\u9891\u6b21\u7279\u5f81\u3002\u8fd9\u4e2a\u793a\u4f8b\u7684\u8d2d\u4e70\u8bb0\u5f55\u4e2d\uff0c\u6709\u7684\u5ba2\u6237\u5305\u542b\u591a\u884c\u6570\u636e\uff0c\u76f4\u63a5\u5408\u5e76\u540e\u8ba2\u5355\u6570\u636e\u5c06\u4ece 8 \u884c\u53d8\u4e3a 12 \u884c\u3002\u5b9e\u9645\u5e94\u7528\u65f6\uff0c\u53ef\u4ee5\u5148\u6309<code>customer_id<\/code>\u5bf9<code>purchase_count<\/code>\u8fdb\u884c\u5408\u8ba1\uff0c\u5408\u8ba1\u540e\u8fdb\u884c\u5408\u5e76\u3002<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code># \u521b\u5efa\u5ba2\u6237\u8d2d\u4e70\u8bb0\u5f55\u7684DataFrame\npurchase_history = {\n    'customer_id': &#91;101, 102, 103, 104, 105, 106, 107, 108, 101, 102, 103, 104],\n    'purchase_count': &#91;2, 3, 1, 2, 1, 3, 2, 1, 1, 2, 1, 3]\n}\ndf_purchase_history = pd.DataFrame(purchase_history)\n\n# \u5408\u5e76\u5ba2\u6237\u8d2d\u4e70\u8bb0\u5f55\ndf_transformed = pd.merge(df_encoded, df_purchase_history, on='customer_id', how='left')\n\nprint(\"\\n\u6784\u9020\u7528\u6237\u8d2d\u4e70\u9891\u6b21\u7279\u5f81\u540e:\")\nprint(df_transformed)<\/code><\/pre>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"6_%E8%BD%AC%E6%8D%A2%E6%97%B6%E9%97%B4%E6%88%B3%E4%B8%BA%E5%8F%AF%E6%8E%92%E5%BA%8F%E7%9A%84%E6%97%B6%E9%97%B4%E5%BA%8F%E5%88%97\"><\/span>6. \u8f6c\u6362\u65f6\u95f4\u6233\u4e3a\u53ef\u6392\u5e8f\u7684\u65f6\u95f4\u5e8f\u5217<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<p>\u5728\u6211\u4eec\u7684\u4f8b\u5b50\u4e2d\uff0c<code>order_date<\/code>\u5df2\u7ecf\u662f\u65e5\u671f\u65f6\u95f4\u683c\u5f0f\uff0c\u53ef\u4ee5\u76f4\u63a5\u6392\u5e8f\u3002<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code># \u786e\u4fddorder_date\u662fdatetime\u7c7b\u578b\ndf_transformed&#91;'order_date'] = pd.to_datetime(df_transformed&#91;'order_date'])\n\n# \u6309order_date\u6392\u5e8f\ndf_sorted = df_transformed.sort_values(by='order_date')\n\nprint(\"\\n\u6309order_date\u6392\u5e8f\u540e:\")\nprint(df_sorted)<\/code><\/pre>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"7_%E6%9E%84%E9%80%A0%E5%95%86%E5%93%81%E9%94%80%E9%87%8F%E6%8E%92%E5%90%8D%E5%AD%97%E6%AE%B5\"><\/span>7. 
\u6784\u9020\u5546\u54c1\u9500\u91cf\u6392\u540d\u5b57\u6bb5<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<p>\u5047\u8bbe\u6211\u4eec\u6709\u4e00\u4e2a\u5546\u54c1\u9500\u91cf\u7edf\u8ba1\u7684DataFrame\uff0c\u7528\u4e8e\u6784\u9020\u5546\u54c1\u9500\u91cf\u6392\u540d\u7279\u5f81\u3002<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code># \u521b\u5efa\u5546\u54c1\u9500\u91cf\u7edf\u8ba1\u7684DataFrame\nproduct_sales = {\n    'product_id': &#91;'A001', 'B002', 'D004', 'E005', 'F006', 'G007', 'H008', 'I009'],\n    'sales_rank': &#91;1, 2, 3, 4, 5, 6, 7, 8]\n}\ndf_product_sales = pd.DataFrame(product_sales)\n\n# \u5408\u5e76\u5546\u54c1\u9500\u91cf\u7edf\u8ba1\ndf_final = pd.merge(df_sorted, df_product_sales, on='product_id', how='left')\n\nprint(\"\\n\u6784\u9020\u5546\u54c1\u9500\u91cf\u6392\u540d\u5b57\u6bb5\u540e:\")\nprint(df_final)<\/code><\/pre>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"8_%E5%AF%B9%E4%BB%B7%E6%A0%BC%E8%BF%9B%E8%A1%8C%E6%A0%87%E5%87%86%E5%8C%96%EF%BC%88Z-score%EF%BC%89\"><\/span>8. \u5bf9\u4ef7\u683c\u8fdb\u884c\u6807\u51c6\u5316\uff08Z-score\uff09<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<pre class=\"wp-block-code\"><code>from scipy.stats import zscore\n\n# \u5bf9amount\u5217\u8fdb\u884cz-score\u6807\u51c6\u5316\ndf_final&#91;'amount_zscore'] = zscore(df_final&#91;'amount'])\n\nprint(\"\\n\u5bf9\u4ef7\u683c\u8fdb\u884c\u6807\u51c6\u5316\u540e:\")\nprint(df_final)<\/code><\/pre>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"9_%E6%9E%84%E9%80%A0%E6%98%AF%E5%90%A6%E5%8F%82%E4%B8%8E%E4%BF%83%E9%94%80%E7%9A%84%E5%B8%83%E5%B0%94%E6%A0%87%E7%AD%BE\"><\/span>9. 
\u6784\u9020\u662f\u5426\u53c2\u4e0e\u4fc3\u9500\u7684\u5e03\u5c14\u6807\u7b7e<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<pre class=\"wp-block-code\"><code># \u6784\u9020\u662f\u5426\u53c2\u4e0e\u4fc3\u9500\u7684\u5e03\u5c14\u6807\u7b7e\ndf_final&#91;'is_promotion'] = df_final&#91;'promotion'].astype(bool)\n\nprint(\"\\n\u6784\u9020\u662f\u5426\u53c2\u4e0e\u4fc3\u9500\u7684\u5e03\u5c14\u6807\u7b7e\u540e:\")\nprint(df_final)<\/code><\/pre>\n\n\n\n<p>\u7efc\u5408\u4ee5\u4e0a\u6b65\u9aa4\uff0c\u751f\u6210\u6700\u7ec8\u8f6c\u6362\u540e\u6570\u636e\u7684\u4ee3\u7801\u5982\u4e0b\uff1a<\/p>\n\n\n\n<p>\u8fd9\u6bb5\u4ee3\u7801\u5c55\u793a\u4e86\u4ece\u539f\u59cb\u6570\u636e\u5230\u7ecf\u8fc7\u5168\u9762\u8f6c\u6362\u7684\u6570\u636e\u7684\u8fc7\u7a0b\u3002\u4f60\u53ef\u4ee5\u6839\u636e\u5b9e\u9645\u9700\u6c42\u8c03\u6574\u6bcf\u4e00\u6b65\u7684\u64cd\u4f5c\u3002<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>import pandas as pd\r\nimport numpy as np\r\nfrom scipy.stats import zscore\r\n\r\n# \u521b\u5efa\u793a\u4f8bDataFrame\r\ndata = {\r\n    'order_id': &#91;1, 2, 3, 4, 5, 6, 7, 8],\r\n    'product_id': &#91;'A001', 'B002', 'D004', 'E005', 'F006', 'G007', 'H008', 'I009'],\r\n    'category_code': &#91;'C1', 'C2', 'C1', 'C3', 'C4', 'C5', 'C6', 'C7'],\r\n    'amount': &#91;100.00, 200.00, 300.00, 400.00, 500.00, 600.00, 700.00, 800.00],\r\n    'original_price': &#91;120.00, 220.00, 320.00, 420.00, 520.00, 620.00, 720.00, 820.00],\r\n    'quantity': &#91;1, 2, 1, 1, 2, 1, 1, 2],\r\n    'order_date': &#91;'2025-06-01', '2025-06-02', '2025-06-03', '2025-06-04', '2025-06-05', '2025-06-06', '2025-06-07', '2025-06-08'],\r\n    'customer_id': &#91;101, 102, 103, 104, 105, 106, 107, 108],\r\n    'promotion': &#91;False, True, False, True, False, True, False, True]\r\n}\r\n\r\ndf = pd.DataFrame(data)\r\n\r\n# \u8f6c\u6362order_date\u4e3a\u65e5\u671f\u683c\u5f0f\r\ndf&#91;'order_date'] = pd.to_datetime(df&#91;'order_date'])\r\n\r\n# 
\u63d0\u53d6\u5e74\u3001\u6708\u3001\u5468\u3001\u661f\u671f\u51e0\r\ndf&#91;'year'] = df&#91;'order_date'].dt.year\r\ndf&#91;'month'] = df&#91;'order_date'].dt.month\r\ndf&#91;'week_of_year'] = df&#91;'order_date'].dt.isocalendar().week.astype(int)\r\ndf&#91;'day_of_week'] = df&#91;'order_date'].dt.dayofweek\r\n\r\n# \u5c06category_code\u8fdb\u884cone-hot encoding\r\ndf_encoded = pd.get_dummies(df, columns=&#91;'category_code'], prefix='cat')\r\n\r\n# \u8ba1\u7b97\u8ba2\u5355\u603b\u91d1\u989d\r\ndf_encoded&#91;'total_amount'] = df_encoded&#91;'amount'] * df_encoded&#91;'quantity']\r\n\r\n# \u8ba1\u7b97\u6298\u6263\u7387\r\ndf_encoded&#91;'discount_rate'] = (df_encoded&#91;'amount'] \/ df_encoded&#91;'original_price']).round(2)\r\n\r\n# \u521b\u5efa\u5ba2\u6237\u8d2d\u4e70\u8bb0\u5f55\u7684DataFrame\r\npurchase_history = {\r\n    'customer_id': &#91;101, 102, 103, 104, 105, 106, 107, 108, 101, 102, 103, 104],\r\n    'purchase_count': &#91;2, 3, 1, 2, 1, 3, 2, 1, 1, 2, 1, 3]\r\n}\r\ndf_purchase_history = pd.DataFrame(purchase_history)\r\n\r\n# \u5408\u5e76\u5ba2\u6237\u8d2d\u4e70\u8bb0\u5f55\r\ndf_transformed = pd.merge(df_encoded, df_purchase_history, on='customer_id', how='left')\r\n\r\n# \u786e\u4fddorder_date\u662fdatetime\u7c7b\u578b\r\ndf_transformed&#91;'order_date'] = pd.to_datetime(df_transformed&#91;'order_date'])\r\n\r\n# \u6309order_date\u6392\u5e8f\r\ndf_sorted = df_transformed.sort_values(by='order_date')\r\n\r\n# \u521b\u5efa\u5546\u54c1\u9500\u91cf\u7edf\u8ba1\u7684DataFrame\r\nproduct_sales = {\r\n    'product_id': &#91;'A001', 'B002', 'D004', 'E005', 'F006', 'G007', 'H008', 'I009'],\r\n    'sales_rank': &#91;1, 2, 3, 4, 5, 6, 7, 8]\r\n}\r\ndf_product_sales = pd.DataFrame(product_sales)\r\n\r\n# \u5408\u5e76\u5546\u54c1\u9500\u91cf\u7edf\u8ba1\r\ndf_final = pd.merge(df_sorted, df_product_sales, on='product_id', how='left')\r\n\r\n# \u5bf9amount\u5217\u8fdb\u884cz-score\u6807\u51c6\u5316\r\ndf_final&#91;'amount_zscore'] = 
zscore(df_final&#91;'amount'])\r\n\r\n# \u6784\u9020\u662f\u5426\u53c2\u4e0e\u4fc3\u9500\u7684\u5e03\u5c14\u6807\u7b7e\r\ndf_final&#91;'is_promotion'] = df_final&#91;'promotion'].astype(bool)\r\n\r\nprint(\"\u6700\u7ec8\u8f6c\u6362\u540e\u7684\u6570\u636e:\")\r\nprint(df_final)\r\n\r\n\r\n\r\n<\/code><\/pre>\n","protected":false},"excerpt":{"rendered":"<p>\u5e38\u7528\u7684\u6570\u636e\u8f6c\u6362\u5206\u7c7b\uff1a \u6211\u4eec\u5c06\u5c55\u793a\u5982\u4f55\u8fdb\u884c\u8fd9\u4e9b\u5e38\u89c1\u7684\u6570\u636e\u8f6c\u6362\u4efb\u52a1\u3002\u5047\u8bbe\u6211\u4eec\u6709\u4e00\u4e2a\u5305\u542b\u9500\u552e\u8ba2\u5355\u6570\u636e\u7684D&hellip; <a href=\"http:\/\/viplao.com\/index.php\/2025\/06\/28\/%e3%80%90python%e5%ae%9e%e8%b7%b5%e7%bb%8f%e9%aa%8c%e3%80%91%e7%94%b5%e5%95%86%e5%b9%b3%e5%8f%b0%e9%94%80%e5%94%ae%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90%e5%ae%9e%e8%b7%b5%e5%88%86%e8%a7%a3\/\" class=\"more-link read-more\" rel=\"bookmark\">\u7ee7\u7eed\u9605\u8bfb <span class=\"screen-reader-text\">\u3010Python10\u5e74\u7ecf\u9a8c\u603b\u7ed3\u3011\u7b2c\u4e09\u8bfe \u7535\u5546\u5e73\u53f0\u9500\u552e\u6570\u636e\u5206\u6790\u5b9e\u8df5\u5206\u89e3 \u2013 \u6570\u636e\u8f6c\u6362\uff08Data Transformation\uff09<\/span><i class=\"fa 
fa-arrow-right\"><\/i><\/a><\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"closed","ping_status":"open","sticky":false,"template":"","format":"standard","meta":[],"categories":[1],"tags":[28],"views":797,"_links":{"self":[{"href":"http:\/\/viplao.com\/index.php\/wp-json\/wp\/v2\/posts\/3538"}],"collection":[{"href":"http:\/\/viplao.com\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"http:\/\/viplao.com\/index.php\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"http:\/\/viplao.com\/index.php\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"http:\/\/viplao.com\/index.php\/wp-json\/wp\/v2\/comments?post=3538"}],"version-history":[{"count":3,"href":"http:\/\/viplao.com\/index.php\/wp-json\/wp\/v2\/posts\/3538\/revisions"}],"predecessor-version":[{"id":3561,"href":"http:\/\/viplao.com\/index.php\/wp-json\/wp\/v2\/posts\/3538\/revisions\/3561"}],"wp:attachment":[{"href":"http:\/\/viplao.com\/index.php\/wp-json\/wp\/v2\/media?parent=3538"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"http:\/\/viplao.com\/index.php\/wp-json\/wp\/v2\/categories?post=3538"},{"taxonomy":"post_tag","embeddable":true,"href":"http:\/\/viplao.com\/index.php\/wp-json\/wp\/v2\/tags?post=3538"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}