|
1388 | 1388 | "### es la importancia de los predictores " |
1389 | 1389 | ] |
1390 | 1390 | }, |
| 1391 | + { |
| 1392 | + "cell_type": "markdown", |
| 1393 | + "id": "4ed6dcbe-9e95-4cc4-b8fe-13757512e41d", |
| 1394 | + "metadata": {}, |
| 1395 | + "source": [ |
| 1396 | + "## Árboles de Regresión" |
| 1397 | + ] |
| 1398 | + }, |
| 1399 | + { |
| 1400 | + "cell_type": "markdown", |
| 1401 | + "id": "2e85b066-8a10-496d-a150-781a8e5a14e9", |
| 1402 | + "metadata": {}, |
| 1403 | + "source": [ |
| 1404 | + "chrome-extension://efaidnbmnnnibpcajpcglclefindmkaj/https://www2.stat.duke.edu/~rcs46/lectures_2017/08-trees/08-tree-regression.pdf" |
| 1405 | + ] |
| 1406 | + }, |
| 1407 | + { |
| 1408 | + "cell_type": "code", |
| 1409 | + "execution_count": 68, |
| 1410 | + "id": "afa2bc0f-ddde-4f9a-976c-47016f6060d9", |
| 1411 | + "metadata": {}, |
| 1412 | + "outputs": [], |
| 1413 | + "source": [ |
| 1414 | + "import pandas as pd" |
| 1415 | + ] |
| 1416 | + }, |
| 1417 | + { |
| 1418 | + "cell_type": "code", |
| 1419 | + "execution_count": 69, |
| 1420 | + "id": "3dd68ead-37e9-402f-8451-1ee941e90771", |
| 1421 | + "metadata": {}, |
| 1422 | + "outputs": [ |
| 1423 | + { |
| 1424 | + "data": { |
| 1425 | + "text/html": [ |
| 1426 | + "<div>\n", |
| 1427 | + "<style scoped>\n", |
| 1428 | + " .dataframe tbody tr th:only-of-type {\n", |
| 1429 | + " vertical-align: middle;\n", |
| 1430 | + " }\n", |
| 1431 | + "\n", |
| 1432 | + " .dataframe tbody tr th {\n", |
| 1433 | + " vertical-align: top;\n", |
| 1434 | + " }\n", |
| 1435 | + "\n", |
| 1436 | + " .dataframe thead th {\n", |
| 1437 | + " text-align: right;\n", |
| 1438 | + " }\n", |
| 1439 | + "</style>\n", |
| 1440 | + "<table border=\"1\" class=\"dataframe\">\n", |
| 1441 | + " <thead>\n", |
| 1442 | + " <tr style=\"text-align: right;\">\n", |
| 1443 | + " <th></th>\n", |
| 1444 | + " <th>crim</th>\n", |
| 1445 | + " <th>zn</th>\n", |
| 1446 | + " <th>indus</th>\n", |
| 1447 | + " <th>chas</th>\n", |
| 1448 | + " <th>nox</th>\n", |
| 1449 | + " <th>rm</th>\n", |
| 1450 | + " <th>age</th>\n", |
| 1451 | + " <th>dis</th>\n", |
| 1452 | + " <th>rad</th>\n", |
| 1453 | + " <th>tax</th>\n", |
| 1454 | + " <th>ptratio</th>\n", |
| 1455 | + " <th>black</th>\n", |
| 1456 | + " <th>lstat</th>\n", |
| 1457 | + " <th>medv</th>\n", |
| 1458 | + " </tr>\n", |
| 1459 | + " </thead>\n", |
| 1460 | + " <tbody>\n", |
| 1461 | + " <tr>\n", |
| 1462 | + " <th>0</th>\n", |
| 1463 | + " <td>0.00632</td>\n", |
| 1464 | + " <td>18.0</td>\n", |
| 1465 | + " <td>2.31</td>\n", |
| 1466 | + " <td>0</td>\n", |
| 1467 | + " <td>0.538</td>\n", |
| 1468 | + " <td>6.575</td>\n", |
| 1469 | + " <td>65.2</td>\n", |
| 1470 | + " <td>4.0900</td>\n", |
| 1471 | + " <td>1</td>\n", |
| 1472 | + " <td>296</td>\n", |
| 1473 | + " <td>15.3</td>\n", |
| 1474 | + " <td>396.90</td>\n", |
| 1475 | + " <td>4.98</td>\n", |
| 1476 | + " <td>24.0</td>\n", |
| 1477 | + " </tr>\n", |
| 1478 | + " <tr>\n", |
| 1479 | + " <th>1</th>\n", |
| 1480 | + " <td>0.02731</td>\n", |
| 1481 | + " <td>0.0</td>\n", |
| 1482 | + " <td>7.07</td>\n", |
| 1483 | + " <td>0</td>\n", |
| 1484 | + " <td>0.469</td>\n", |
| 1485 | + " <td>6.421</td>\n", |
| 1486 | + " <td>78.9</td>\n", |
| 1487 | + " <td>4.9671</td>\n", |
| 1488 | + " <td>2</td>\n", |
| 1489 | + " <td>242</td>\n", |
| 1490 | + " <td>17.8</td>\n", |
| 1491 | + " <td>396.90</td>\n", |
| 1492 | + " <td>9.14</td>\n", |
| 1493 | + " <td>21.6</td>\n", |
| 1494 | + " </tr>\n", |
| 1495 | + " <tr>\n", |
| 1496 | + " <th>2</th>\n", |
| 1497 | + " <td>0.02729</td>\n", |
| 1498 | + " <td>0.0</td>\n", |
| 1499 | + " <td>7.07</td>\n", |
| 1500 | + " <td>0</td>\n", |
| 1501 | + " <td>0.469</td>\n", |
| 1502 | + " <td>7.185</td>\n", |
| 1503 | + " <td>61.1</td>\n", |
| 1504 | + " <td>4.9671</td>\n", |
| 1505 | + " <td>2</td>\n", |
| 1506 | + " <td>242</td>\n", |
| 1507 | + " <td>17.8</td>\n", |
| 1508 | + " <td>392.83</td>\n", |
| 1509 | + " <td>4.03</td>\n", |
| 1510 | + " <td>34.7</td>\n", |
| 1511 | + " </tr>\n", |
| 1512 | + " <tr>\n", |
| 1513 | + " <th>3</th>\n", |
| 1514 | + " <td>0.03237</td>\n", |
| 1515 | + " <td>0.0</td>\n", |
| 1516 | + " <td>2.18</td>\n", |
| 1517 | + " <td>0</td>\n", |
| 1518 | + " <td>0.458</td>\n", |
| 1519 | + " <td>6.998</td>\n", |
| 1520 | + " <td>45.8</td>\n", |
| 1521 | + " <td>6.0622</td>\n", |
| 1522 | + " <td>3</td>\n", |
| 1523 | + " <td>222</td>\n", |
| 1524 | + " <td>18.7</td>\n", |
| 1525 | + " <td>394.63</td>\n", |
| 1526 | + " <td>2.94</td>\n", |
| 1527 | + " <td>33.4</td>\n", |
| 1528 | + " </tr>\n", |
| 1529 | + " <tr>\n", |
| 1530 | + " <th>4</th>\n", |
| 1531 | + " <td>0.06905</td>\n", |
| 1532 | + " <td>0.0</td>\n", |
| 1533 | + " <td>2.18</td>\n", |
| 1534 | + " <td>0</td>\n", |
| 1535 | + " <td>0.458</td>\n", |
| 1536 | + " <td>7.147</td>\n", |
| 1537 | + " <td>54.2</td>\n", |
| 1538 | + " <td>6.0622</td>\n", |
| 1539 | + " <td>3</td>\n", |
| 1540 | + " <td>222</td>\n", |
| 1541 | + " <td>18.7</td>\n", |
| 1542 | + " <td>396.90</td>\n", |
| 1543 | + " <td>5.33</td>\n", |
| 1544 | + " <td>36.2</td>\n", |
| 1545 | + " </tr>\n", |
| 1546 | + " </tbody>\n", |
| 1547 | + "</table>\n", |
| 1548 | + "</div>" |
| 1549 | + ], |
| 1550 | + "text/plain": [ |
| 1551 | + " crim zn indus chas nox rm age dis rad tax ptratio \\\n", |
| 1552 | + "0 0.00632 18.0 2.31 0 0.538 6.575 65.2 4.0900 1 296 15.3 \n", |
| 1553 | + "1 0.02731 0.0 7.07 0 0.469 6.421 78.9 4.9671 2 242 17.8 \n", |
| 1554 | + "2 0.02729 0.0 7.07 0 0.469 7.185 61.1 4.9671 2 242 17.8 \n", |
| 1555 | + "3 0.03237 0.0 2.18 0 0.458 6.998 45.8 6.0622 3 222 18.7 \n", |
| 1556 | + "4 0.06905 0.0 2.18 0 0.458 7.147 54.2 6.0622 3 222 18.7 \n", |
| 1557 | + "\n", |
| 1558 | + " black lstat medv \n", |
| 1559 | + "0 396.90 4.98 24.0 \n", |
| 1560 | + "1 396.90 9.14 21.6 \n", |
| 1561 | + "2 392.83 4.03 34.7 \n", |
| 1562 | + "3 394.63 2.94 33.4 \n", |
| 1563 | + "4 396.90 5.33 36.2 " |
| 1564 | + ] |
| 1565 | + }, |
| 1566 | + "execution_count": 69, |
| 1567 | + "metadata": {}, |
| 1568 | + "output_type": "execute_result" |
| 1569 | + } |
| 1570 | + ], |
| 1571 | + "source": [ |
| 1572 | + "data = pd.read_csv(\"../datasets/boston/Boston.csv\")\n", |
| 1573 | + "data.head()" |
| 1574 | + ] |
| 1575 | + }, |
| 1576 | + { |
| 1577 | + "cell_type": "markdown", |
| 1578 | + "id": "88c7a8bf-0d46-43bc-9046-06fb28c784ff", |
| 1579 | + "metadata": {}, |
| 1580 | + "source": [ |
| 1581 | + "https://www.kaggle.com/code/prasadperera/the-boston-housing-dataset" |
| 1582 | + ] |
| 1583 | + }, |
| 1584 | + { |
| 1585 | + "cell_type": "code", |
| 1586 | + "execution_count": 70, |
| 1587 | + "id": "d85726b1-aca5-45f4-812b-d2572aeadcc0", |
| 1588 | + "metadata": {}, |
| 1589 | + "outputs": [ |
| 1590 | + { |
| 1591 | + "data": { |
| 1592 | + "text/plain": [ |
| 1593 | + "(506, 14)" |
| 1594 | + ] |
| 1595 | + }, |
| 1596 | + "execution_count": 70, |
| 1597 | + "metadata": {}, |
| 1598 | + "output_type": "execute_result" |
| 1599 | + } |
| 1600 | + ], |
| 1601 | + "source": [ |
| 1602 | + "data.shape" |
| 1603 | + ] |
| 1604 | + }, |
| 1605 | + { |
| 1606 | + "cell_type": "code", |
| 1607 | + "execution_count": 71, |
| 1608 | + "id": "3a861e3f-c183-4f01-aaf1-c388f1b531dd", |
| 1609 | + "metadata": {}, |
| 1610 | + "outputs": [], |
| 1611 | + "source": [ |
| 1612 | + "colnames = data.columns.values.tolist()\n", |
| 1613 | + "predictors = colnames[:13]\n", |
| 1614 | + "target = colnames[13]\n", |
| 1615 | + "X=data[predictors]\n", |
| 1616 | + "Y = data[target]" |
| 1617 | + ] |
| 1618 | + }, |
1391 | 1619 | { |
1392 | 1620 | "cell_type": "code", |
1393 | 1621 | "execution_count": null, |
1394 | | - "id": "d3dfa653-8e21-412e-bc48-6c8f56b8835d", |
| 1622 | + "id": "be2adede-53a0-4306-b4e2-00b1a6edb6d6", |
1395 | 1623 | "metadata": {}, |
1396 | 1624 | "outputs": [], |
1397 | 1625 | "source": [] |
|
0 commit comments