{"cells": [{"cell_type": "markdown", "metadata": {}, "source": ["# S\u00e9ance big data\n", "\n", "D\u00e9couverte de plusieurs fa\u00e7ons de calculer des statistiques sur des fichiers volumineux."]}, {"cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [{"data": {"text/html": ["
\n", ""], "text/plain": ["\n", " | FLX_ANN_MOI | \n", "ORG_CLE_REG | \n", "AGE_BEN_SNDS | \n", "BEN_RES_REG | \n", "BEN_CMU_TOP | \n", "BEN_QLT_COD | \n", "BEN_SEX_COD | \n", "DDP_SPE_COD | \n", "ETE_CAT_SNDS | \n", "ETE_REG_COD | \n", "... | \n", "PSE_ACT_CAT | \n", "PSE_SPE_SNDS | \n", "PSE_STJ_SNDS | \n", "PRE_INS_REG | \n", "PSP_ACT_SNDS | \n", "PSP_ACT_CAT | \n", "PSP_SPE_SNDS | \n", "PSP_STJ_SNDS | \n", "TOP_PS5_TRG | \n", "Unnamed: 55 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "201612 | \n", "76 | \n", "20 | \n", "76 | \n", "9 | \n", "1 | \n", "1 | \n", "0 | \n", "1101 | \n", "76 | \n", "... | \n", "0 | \n", "14 | \n", "2 | \n", "99 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "9 | \n", "NaN | \n", "
1 | \n", "201612 | \n", "28 | \n", "30 | \n", "28 | \n", "9 | \n", "1 | \n", "2 | \n", "0 | \n", "9999 | \n", "99 | \n", "... | \n", "2 | \n", "0 | \n", "1 | \n", "99 | \n", "0 | \n", "0 | \n", "6 | \n", "2 | \n", "9 | \n", "NaN | \n", "
2 | \n", "201612 | \n", "27 | \n", "60 | \n", "93 | \n", "9 | \n", "2 | \n", "1 | \n", "0 | \n", "9999 | \n", "99 | \n", "... | \n", "2 | \n", "0 | \n", "9 | \n", "93 | \n", "0 | \n", "1 | \n", "1 | \n", "9 | \n", "9 | \n", "NaN | \n", "
3 | \n", "201612 | \n", "32 | \n", "40 | \n", "32 | \n", "9 | \n", "2 | \n", "2 | \n", "0 | \n", "9999 | \n", "99 | \n", "... | \n", "1 | \n", "1 | \n", "1 | \n", "32 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "9 | \n", "NaN | \n", "
4 | \n", "201612 | \n", "32 | \n", "30 | \n", "32 | \n", "9 | \n", "1 | \n", "2 | \n", "0 | \n", "2206 | \n", "32 | \n", "... | \n", "0 | \n", "0 | \n", "2 | \n", "99 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "9 | \n", "NaN | \n", "
5 rows \u00d7 56 columns
\n", "\n", " | 0 | \n", "1 | \n", "2 | \n", "3 | \n", "4 | \n", "
---|---|---|---|---|---|
FLX_ANN_MOI | \n", "201612.0 | \n", "201612.00 | \n", "201612.0 | \n", "201612.0 | \n", "201612.0 | \n", "
ORG_CLE_REG | \n", "76.0 | \n", "28.00 | \n", "27.0 | \n", "32.0 | \n", "32.0 | \n", "
AGE_BEN_SNDS | \n", "20.0 | \n", "30.00 | \n", "60.0 | \n", "40.0 | \n", "30.0 | \n", "
BEN_RES_REG | \n", "76.0 | \n", "28.00 | \n", "93.0 | \n", "32.0 | \n", "32.0 | \n", "
BEN_CMU_TOP | \n", "9.0 | \n", "9.00 | \n", "9.0 | \n", "9.0 | \n", "9.0 | \n", "
BEN_QLT_COD | \n", "1.0 | \n", "1.00 | \n", "2.0 | \n", "2.0 | \n", "1.0 | \n", "
BEN_SEX_COD | \n", "1.0 | \n", "2.00 | \n", "1.0 | \n", "2.0 | \n", "2.0 | \n", "
DDP_SPE_COD | \n", "0.0 | \n", "0.00 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "
ETE_CAT_SNDS | \n", "1101.0 | \n", "9999.00 | \n", "9999.0 | \n", "9999.0 | \n", "2206.0 | \n", "
ETE_REG_COD | \n", "76.0 | \n", "99.00 | \n", "99.0 | \n", "99.0 | \n", "32.0 | \n", "
ETE_TYP_SNDS | \n", "1.0 | \n", "99.00 | \n", "99.0 | \n", "99.0 | \n", "6.0 | \n", "
ETP_REG_COD | \n", "76.0 | \n", "24.00 | \n", "99.0 | \n", "99.0 | \n", "32.0 | \n", "
ETP_CAT_SNDS | \n", "1101.0 | \n", "1102.00 | \n", "9999.0 | \n", "9999.0 | \n", "2206.0 | \n", "
MDT_TYP_COD | \n", "9.0 | \n", "9.00 | \n", "9.0 | \n", "9.0 | \n", "9.0 | \n", "
MFT_COD | \n", "3.0 | \n", "99.00 | \n", "99.0 | \n", "99.0 | \n", "36.0 | \n", "
PRS_FJH_TYP | \n", "0.0 | \n", "0.00 | \n", "8.0 | \n", "0.0 | \n", "0.0 | \n", "
PRS_ACT_COG | \n", "2.0 | \n", "1.00 | \n", "1.0 | \n", "2.0 | \n", "1.0 | \n", "
PRS_ACT_NBR | \n", "1.0 | \n", "5.00 | \n", "NaN | \n", "2.0 | \n", "1.0 | \n", "
PRS_ACT_QTE | \n", "1.0 | \n", "1.00 | \n", "1.0 | \n", "2.0 | \n", "1.0 | \n", "
PRS_DEP_MNT | \n", "0.0 | \n", "0.00 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "
PRS_PAI_MNT | \n", "46.0 | \n", "0.51 | \n", "0.0 | \n", "46.0 | \n", "23.0 | \n", "
PRS_REM_BSE | \n", "46.0 | \n", "0.51 | \n", "0.0 | \n", "46.0 | \n", "23.0 | \n", "
PRS_REM_MNT | \n", "46.0 | \n", "0.51 | \n", "-0.5 | \n", "32.2 | \n", "23.0 | \n", "
FLT_ACT_COG | \n", "2.0 | \n", "1.00 | \n", "1.0 | \n", "2.0 | \n", "1.0 | \n", "
FLT_ACT_NBR | \n", "1.0 | \n", "5.00 | \n", "NaN | \n", "2.0 | \n", "1.0 | \n", "
FLT_ACT_QTE | \n", "1.0 | \n", "1.00 | \n", "1.0 | \n", "2.0 | \n", "1.0 | \n", "
FLT_PAI_MNT | \n", "46.0 | \n", "0.51 | \n", "0.0 | \n", "46.0 | \n", "23.0 | \n", "
FLT_DEP_MNT | \n", "0.0 | \n", "0.00 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "
FLT_REM_MNT | \n", "46.0 | \n", "0.51 | \n", "-0.5 | \n", "32.2 | \n", "23.0 | \n", "
SOI_ANN | \n", "2016.0 | \n", "2016.00 | \n", "2016.0 | \n", "2016.0 | \n", "2016.0 | \n", "
SOI_MOI | \n", "12.0 | \n", "12.00 | \n", "12.0 | \n", "12.0 | \n", "12.0 | \n", "
ASU_NAT | \n", "40.0 | \n", "10.00 | \n", "10.0 | \n", "10.0 | \n", "10.0 | \n", "
ATT_NAT | \n", "0.0 | \n", "0.00 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "
CPL_COD | \n", "0.0 | \n", "0.00 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "
CPT_ENV_TYP | \n", "9.0 | \n", "9.00 | \n", "9.0 | \n", "9.0 | \n", "9.0 | \n", "
DRG_AFF_NAT | \n", "99.0 | \n", "99.00 | \n", "99.0 | \n", "99.0 | \n", "99.0 | \n", "
ETE_IND_TAA | \n", "1.0 | \n", "9.00 | \n", "9.0 | \n", "9.0 | \n", "0.0 | \n", "
EXO_MTF | \n", "99.0 | \n", "99.00 | \n", "99.0 | \n", "99.0 | \n", "99.0 | \n", "
MTM_NAT | \n", "9.0 | \n", "9.00 | \n", "9.0 | \n", "9.0 | \n", "9.0 | \n", "
PRS_NAT | \n", "1117.0 | \n", "3380.00 | \n", "1972.0 | \n", "1111.0 | \n", "1111.0 | \n", "
PRS_PPU_SEC | \n", "1.0 | \n", "2.00 | \n", "2.0 | \n", "2.0 | \n", "2.0 | \n", "
PRS_REM_TAU | \n", "100.0 | \n", "100.00 | \n", "100.0 | \n", "70.0 | \n", "100.0 | \n", "
PRS_REM_TYP | \n", "99.0 | \n", "99.00 | \n", "99.0 | \n", "99.0 | \n", "99.0 | \n", "
PRS_PDS_QCP | \n", "3.0 | \n", "31.00 | \n", "31.0 | \n", "10.0 | \n", "31.0 | \n", "
EXE_INS_REG | \n", "99.0 | \n", "28.00 | \n", "93.0 | \n", "32.0 | \n", "99.0 | \n", "
PSE_ACT_SNDS | \n", "0.0 | \n", "50.00 | \n", "50.0 | \n", "0.0 | \n", "19.0 | \n", "
PSE_ACT_CAT | \n", "0.0 | \n", "2.00 | \n", "2.0 | \n", "1.0 | \n", "0.0 | \n", "
PSE_SPE_SNDS | \n", "14.0 | \n", "0.00 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
PSE_STJ_SNDS | \n", "2.0 | \n", "1.00 | \n", "9.0 | \n", "1.0 | \n", "2.0 | \n", "
PRE_INS_REG | \n", "99.0 | \n", "99.00 | \n", "93.0 | \n", "32.0 | \n", "99.0 | \n", "
PSP_ACT_SNDS | \n", "0.0 | \n", "0.00 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "
PSP_ACT_CAT | \n", "0.0 | \n", "0.00 | \n", "1.0 | \n", "1.0 | \n", "0.0 | \n", "
PSP_SPE_SNDS | \n", "1.0 | \n", "6.00 | \n", "1.0 | \n", "1.0 | \n", "1.0 | \n", "
PSP_STJ_SNDS | \n", "2.0 | \n", "2.00 | \n", "9.0 | \n", "1.0 | \n", "2.0 | \n", "
TOP_PS5_TRG | \n", "9.0 | \n", "9.00 | \n", "9.0 | \n", "9.0 | \n", "9.0 | \n", "
Unnamed: 55 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
\n", " | AGE_BEN_SNDS | \n", "Tranche d'Age B\u00e9n\u00e9ficiaire au moment des soins | \n", "
---|---|---|
0 | \n", "ASU_NAT | \n", "Nature d'Assurance | \n", "
1 | \n", "ATT_NAT | \n", "Nature de l'Accident du Travail | \n", "
2 | \n", "BEN_CMU_TOP | \n", "Top B\u00e9n\u00e9ficiaire CMU-C | \n", "
3 | \n", "BEN_QLT_COD | \n", "Qualit\u00e9 du B\u00e9n\u00e9ficiaire | \n", "
4 | \n", "BEN_RES_ZEAT | \n", "ZEAT de R\u00e9sidence du B\u00e9n\u00e9ficiaire | \n", "
5 | \n", "BEN_SEX_COD | \n", "Sexe du B\u00e9n\u00e9ficiaire | \n", "
6 | \n", "CPL_COD | \n", "Compl\u00e9ment d'Acte | \n", "
7 | \n", "CPT_ENV_TYP | \n", "Type d'Enveloppe | \n", "
8 | \n", "DDP_SPE_COD | \n", "Discipline de Prestation Etb Ex\u00e9cutant | \n", "
9 | \n", "DRG_AFF_NAT | \n", "Nature du Destinataire de R\u00e8glement affin\u00e9 | \n", "
10 | \n", "ETE_CAT_SNDS | \n", "Cat\u00e9gorie Etb Ex\u00e9cutant | \n", "
11 | \n", "ETE_IND_TAA | \n", "Indicateur TAA Priv\u00e9/Public | \n", "
12 | \n", "ETE_TYP_SNDS | \n", "Type Etb Ex\u00e9cutant | \n", "
13 | \n", "ETE_ZEAT_COD | \n", "ZEAT d'Implantation Etb Ex\u00e9cutant | \n", "
14 | \n", "ETP_CAT_SNDS | \n", "Cat\u00e9gorie Etb Prescripteur | \n", "
15 | \n", "ETP_ZEAT_COD | \n", "ZEAT d'Implantation Etb Prescripteur | \n", "
16 | \n", "EXE_INS_ZEAT | \n", "ZEAT du PS Ex\u00e9cutant | \n", "
17 | \n", "EXO_MTF | \n", "Motif d'Exon\u00e9ration du Ticket Mod\u00e9rateur | \n", "
18 | \n", "FLT_ACT_COG | \n", "Coefficient Global de la Prestation Pr\u00e9filtr\u00e9 | \n", "
19 | \n", "FLT_ACT_NBR | \n", "D\u00e9nombrement de la Prestation Pr\u00e9filtr\u00e9 | \n", "
20 | \n", "FLT_ACT_QTE | \n", "Quantit\u00e9 de la Prestation Pr\u00e9filtr\u00e9e | \n", "
21 | \n", "FLT_DEP_MNT | \n", "Montant du D\u00e9passement de la Prestation Pr\u00e9filtr\u00e9 | \n", "
22 | \n", "FLT_PAI_MNT | \n", "Montant de la D\u00e9pense de la Prestation Pr\u00e9filtr\u00e9e | \n", "
23 | \n", "FLT_REM_MNT | \n", "Montant Vers\u00e9/Rembours\u00e9 Pr\u00e9filtr\u00e9 | \n", "
24 | \n", "FLX_ANN_MOI | \n", "Ann\u00e9e et Mois de Traitement | \n", "
25 | \n", "MDT_TYP_COD | \n", "Mode de Traitement Etb Ex\u00e9cutant | \n", "
26 | \n", "MFT_COD | \n", "Mode de Fixation des Tarifs Etb Ex\u00e9cutant | \n", "
27 | \n", "MTM_NAT | \n", "Modulation du Ticket Mod\u00e9rateur | \n", "
28 | \n", "ORG_CLE_ZEAT | \n", "ZEAT de l'Organisme de Liquidation | \n", "
29 | \n", "PRE_INS_ZEAT | \n", "ZEAT du PS Prescripteur | \n", "
30 | \n", "PRS_ACT_COG | \n", "Coefficient Global | \n", "
31 | \n", "PRS_ACT_NBR | \n", "D\u00e9nombrement | \n", "
32 | \n", "PRS_ACT_QTE | \n", "Quantit\u00e9 | \n", "
33 | \n", "PRS_DEP_MNT | \n", "Montant du D\u00e9passement | \n", "
34 | \n", "PRS_FJH_TYP | \n", "Type de Prise en Charge Forfait Journalier | \n", "
35 | \n", "PRS_NAT | \n", "Nature de Prestation | \n", "
36 | \n", "PRS_PAI_MNT | \n", "Montant de la D\u00e9pense | \n", "
37 | \n", "PRS_PDS_QCP | \n", "Code Qualificatif Parcours de Soins (sortie) | \n", "
38 | \n", "PRS_PPU_SEC | \n", "Code Secteur Priv\u00e9/Public | \n", "
39 | \n", "PRS_REM_BSE | \n", "Base de Remboursement | \n", "
40 | \n", "PRS_REM_MNT | \n", "Montant Vers\u00e9/Rembours\u00e9 | \n", "
41 | \n", "PRS_REM_TAU | \n", "Taux de Remboursement | \n", "
42 | \n", "PRS_REM_TYP | \n", "Type de Remboursement | \n", "
43 | \n", "PSE_ACT_CAT | \n", "Cat\u00e9gorie de l' Ex\u00e9cutant | \n", "
44 | \n", "PSE_ACT_SNDS | \n", "Nature d'Activit\u00e9 PS Ex\u00e9cutant | \n", "
45 | \n", "PSE_SPE_SNDS | \n", "Sp\u00e9cialit\u00e9 M\u00e9dicale PS Ex\u00e9cutant | \n", "
46 | \n", "PSE_STJ_SNDS | \n", "Statut Juridique PS Ex\u00e9cutant | \n", "
47 | \n", "PSP_ACT_CAT | \n", "Cat\u00e9gorie du Prescripteur | \n", "
48 | \n", "PSP_ACT_SNDS | \n", "Nature d'Activit\u00e9 PS Prescripteur | \n", "
49 | \n", "PSP_SPE_SNDS | \n", "Sp\u00e9cialit\u00e9 M\u00e9dicale PS Prescripteur | \n", "
50 | \n", "PSP_STJ_SNDS | \n", "Statut Juridique PS Prescripteur | \n", "
51 | \n", "SOI_ANN | \n", "Ann\u00e9e de Soins | \n", "
52 | \n", "SOI_MOI | \n", "Mois de Soins | \n", "
53 | \n", "TOP_PS5_TRG | \n", "Top P\u00e9rim\u00e8tre hors CMU C et prestations pour i... | \n", "
\n", " | FLX_ANN_MOI | \n", "ORG_CLE_REG | \n", "AGE_BEN_SNDS | \n", "BEN_RES_REG | \n", "BEN_CMU_TOP | \n", "BEN_QLT_COD | \n", "BEN_SEX_COD | \n", "DDP_SPE_COD | \n", "ETE_CAT_SNDS | \n", "ETE_REG_COD | \n", "... | \n", "PSE_ACT_CAT | \n", "PSE_SPE_SNDS | \n", "PSE_STJ_SNDS | \n", "PRE_INS_REG | \n", "PSP_ACT_SNDS | \n", "PSP_ACT_CAT | \n", "PSP_SPE_SNDS | \n", "PSP_STJ_SNDS | \n", "TOP_PS5_TRG | \n", "Unnamed: 55 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "201612 | \n", "76 | \n", "20 | \n", "76 | \n", "9 | \n", "1 | \n", "1 | \n", "0 | \n", "1101 | \n", "76 | \n", "... | \n", "0 | \n", "14 | \n", "2 | \n", "99 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "9 | \n", "NaN | \n", "
1 | \n", "201612 | \n", "28 | \n", "30 | \n", "28 | \n", "9 | \n", "1 | \n", "2 | \n", "0 | \n", "9999 | \n", "99 | \n", "... | \n", "2 | \n", "0 | \n", "1 | \n", "99 | \n", "0 | \n", "0 | \n", "6 | \n", "2 | \n", "9 | \n", "NaN | \n", "
2 | \n", "201612 | \n", "27 | \n", "60 | \n", "93 | \n", "9 | \n", "2 | \n", "1 | \n", "0 | \n", "9999 | \n", "99 | \n", "... | \n", "2 | \n", "0 | \n", "9 | \n", "93 | \n", "0 | \n", "1 | \n", "1 | \n", "9 | \n", "9 | \n", "NaN | \n", "
3 | \n", "201612 | \n", "32 | \n", "40 | \n", "32 | \n", "9 | \n", "2 | \n", "2 | \n", "0 | \n", "9999 | \n", "99 | \n", "... | \n", "1 | \n", "1 | \n", "1 | \n", "32 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "9 | \n", "NaN | \n", "
4 | \n", "201612 | \n", "32 | \n", "30 | \n", "32 | \n", "9 | \n", "1 | \n", "2 | \n", "0 | \n", "2206 | \n", "32 | \n", "... | \n", "0 | \n", "0 | \n", "2 | \n", "99 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "9 | \n", "NaN | \n", "
5 rows \u00d7 56 columns
\n", "\n", " | AGE_BEN_SNDS | \n", "count(*) | \n", "
---|---|---|
0 | \n", "0 | \n", "10424 | \n", "
1 | \n", "20 | \n", "10948 | \n", "
2 | \n", "30 | \n", "10871 | \n", "
3 | \n", "40 | \n", "11963 | \n", "
4 | \n", "50 | \n", "14475 | \n", "
5 | \n", "60 | \n", "15662 | \n", "
6 | \n", "70 | \n", "13220 | \n", "
7 | \n", "80 | \n", "12281 | \n", "
8 | \n", "99 | \n", "155 | \n", "
\n", " | FLX_ANN_MOI | \n", "ORG_CLE_REG | \n", "AGE_BEN_SNDS | \n", "BEN_RES_REG | \n", "BEN_CMU_TOP | \n", "BEN_QLT_COD | \n", "BEN_SEX_COD | \n", "DDP_SPE_COD | \n", "ETE_CAT_SNDS | \n", "ETE_REG_COD | \n", "... | \n", "PSE_ACT_CAT | \n", "PSE_SPE_SNDS | \n", "PSE_STJ_SNDS | \n", "PRE_INS_REG | \n", "PSP_ACT_SNDS | \n", "PSP_ACT_CAT | \n", "PSP_SPE_SNDS | \n", "PSP_STJ_SNDS | \n", "TOP_PS5_TRG | \n", "Unnamed: 55 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "201612 | \n", "76 | \n", "20 | \n", "76 | \n", "9 | \n", "1 | \n", "1 | \n", "0 | \n", "1101 | \n", "76 | \n", "... | \n", "0 | \n", "14 | \n", "2 | \n", "99 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "9 | \n", "NaN | \n", "
1 | \n", "201612 | \n", "28 | \n", "30 | \n", "28 | \n", "9 | \n", "1 | \n", "2 | \n", "0 | \n", "9999 | \n", "99 | \n", "... | \n", "2 | \n", "0 | \n", "1 | \n", "99 | \n", "0 | \n", "0 | \n", "6 | \n", "2 | \n", "9 | \n", "NaN | \n", "
2 rows \u00d7 56 columns
\n", "\n", " | PRS_REM_MNT | \n", "
---|---|
AGE_BEN_SNDS | \n", "\n", " |
0 | \n", "2607345.16 | \n", "
20 | \n", "1714894.46 | \n", "
30 | \n", "3378001.46 | \n", "
40 | \n", "3271108.13 | \n", "
50 | \n", "5011475.59 | \n", "
60 | \n", "6026792.72 | \n", "
70 | \n", "4283277.72 | \n", "
80 | \n", "4181565.36 | \n", "
99 | \n", "19015.33 | \n", "