EDA Dumps 2 PDF
EDA Dumps 2 PDF
January 7, 2021
<IPython.core.display.HTML object>
[5]: fname
[5]: 'C:/Users/Samuel/Documents/Machine_Learning/datasets/Dumps/Dumps.csv'
[7]: df.shape
[8]: df.columns
1
[8]: Index(['TimeArrived', 'Truck', 'Destino', 'Origen', 'Shovel', 'Tronadura',
'Tons', 'Distancia', 'TpoViaje', 'TpoEsperaDump', 'TpoDump',
'TipoMIneral', 'OpCAEX', 'OpSHV', 'ExtraLoad'],
dtype='object')
[9]: df.describe()
ExtraLoad
count 2.141621e+06
mean 3.782182e-04
std 1.944416e-02
min 0.000000e+00
25% 0.000000e+00
50% 0.000000e+00
75% 0.000000e+00
max 1.000000e+00
[10]: df.head(5)
2
3 Mineral Media 0985 4243 0
4 Mineral Media 6574 4243 0
[11]: df = df[df['ExtraLoad']!=1]
[12]: df.shape
# Split the 'Origen' code into its fixed-position pieces.
origen_code = df['Origen'].str
df['Fase'] = origen_code.slice(stop=4)
df['Banco'] = origen_code.slice(5, 9)
df['Malla'] = origen_code.slice(10, 12)
df['Otro'] = origen_code.slice(start=-3)

# Speed = distance / travel time / 16.67, rounded to 2 decimals.
# NOTE(review): the divisor looks like a metres-per-minute -> km/h conversion
# (1000 / 60) -- confirm the units of 'Distancia' and 'TpoViaje'.
# Rows whose travel time is not positive get the sentinel value -1.
travel_time_ok = df['TpoViaje'] > 0
speed_raw = (df['Distancia'] / df['TpoViaje'] / 16.6666666666666666).round(2)
df['velocidad'] = np.where(travel_time_ok, speed_raw, -1)

# 'Tronadura' is not used from here on.
del df['Tronadura']
[15]: df.groupby('Truck').size()
[15]: Truck
CA01 164
CA08 174
CA09 233
CA100 27982
CA101 28238
CA102 27168
CA103 20625
CA104 14670
CA105 14209
CA106 12201
CA107 11845
CA11 168
CA13 180
CA28 2705
CA29 4440
CA30 9785
CA50 41859
CA51 41032
CA52 38715
CA53 42359
CA54 41910
CA55 42527
3
CA56 41851
CA57 41484
CA58 43558
CA59 43856
CA60 41336
CA61 44554
CA62 41522
CA63 44779
CA64 43870
CA65 44751
CA66 43018
CA67 41648
CA68 40109
CA69 44803
CA70 42125
CA71 19395
CA72 42134
CA73 43380
CA74 44336
CA76 44294
CA77 43453
CA78 41129
CA79 43274
CA80 41352
CA81 42595
CA82 44235
CA83 44035
CA84 42904
CA85 44005
CA86 46061
CA87 43986
CA88 40653
CA89 41732
CA90 33116
CA91 34768
CA92 34935
CA93 30465
CA94 30156
CA95 30864
CA96 31620
CA97 31924
CA98 32285
CA99 31250
CF10 14
CF11 8
dtype: int64
4
[16]: df.groupby('Destino').size()
[16]: Destino
CH-02 1057559
CH-1 1083252
dtype: int64
[17]: df.groupby('Origen').size()
[17]: Origen
CASE-3020-00/MM1 443
CASE-3020-70/MM1 572
CH-APIRES/MM1 51
CH_3-3065-00/MM1 6
DERR-3230-00/MM1 125
...
STOC-SEC-00/MM1 149
STOC-SECU-00/MM1 1179
STOCK-SEC-00/MM1 224
STOCK_PEL-01/MM1 67
VENT-3027-00/MM1 190
Length: 5990, dtype: int64
[18]: df.groupby('Shovel').size()
[18]: Shovel
BH09 16886
CF02 30522
CF08 69420
CF09 36800
CF10 117978
CF11 123392
PA01 114913
PA03 206792
PA04 360493
PA05 343258
PA06 52401
PA07 451091
PA10 179858
PA11 37007
dtype: int64
[19]: df.groupby('TipoMineral').size()
[19]: TipoMineral
As Alto Prim 272
As Medio Prim 1431
5
Baja Ley 19457
Baja Ley Prim 1638
Esteril 411
Media Ley Prim 21883
Min As Alto 10798
Min As Medio 13325
Min Cal Alto 22259
Min Cal Medio 40696
Mineral Alta 96077
Mineral Media 1903909
Mineral Stock 8650
Nieve 5
dtype: int64
[20]: df.groupby('OpCAEX').size()
[20]: OpCAEX
0001 30
0002 1
0006 2
0013 1
0022 1
...
9850 6824
9917 952
9922 602
9949 7086
mmsunk 11376
Length: 456, dtype: int64
[21]: df.groupby('OpSHV').size()
[21]: OpSHV
0001 267
0002 2
0005 3
0006 4
0011 51
...
9670 9110
9826 35094
9850 1150
9922 3903
mmsunk 52213
Length: 121, dtype: int64
6
[23]: dfZeros
[24]: df = df[(df['Distancia']!=0)&(df['TpoViaje']!=0)]
[25]: df.shape
7
[25]: (2116256, 18)
[26]: df['velocidad'].min()
[26]: 0.56
[28]: dfveloc
8
1363497 1249 8657 STOC 3095 02 MM1 96.00
[30]: df['velocidad'].hist(bins=40)
[30]: <AxesSubplot:>
[31]: df['Distancia'].min()
[31]: 71
[32]: df['Distancia'].hist(bins=40)
[32]: <AxesSubplot:>
9
[33]: df[(df['Distancia']>70000)]
[34]: <AxesSubplot:>
10
[35]: df['Tons'].hist(bins=40)
[35]: <AxesSubplot:>
11
[36]: df[(df['Origen']=='F10N-3260-05/MM2') & (df['Destino']=='CH-02') &␣
,→(df['Distancia']!=0) & (df['OpCAEX']=='8675')]
[37]: df.describe()
velocidad
12
count 2.113793e+06
mean 2.147781e+01
std 3.917369e+00
min 2.460000e+00
25% 1.869000e+01
50% 2.259000e+01
75% 2.456000e+01
max 5.903000e+01
[38]: df.info()
<class 'pandas.core.frame.DataFrame'>
Int64Index: 2113793 entries, 0 to 2141620
Data columns (total 18 columns):
# Column Dtype
--- ------ -----
0 TimeArrived object
1 Truck object
2 Destino object
3 Origen object
4 Shovel object
5 Tons float64
6 Distancia int64
7 TpoViaje float64
8 TpoEsperaDump float64
9 TpoDump float64
10 TipoMineral object
11 OpCAEX object
12 OpSHV object
13 Fase object
14 Banco object
15 Malla object
16 Otro object
17 velocidad float64
dtypes: float64(5), int64(1), object(12)
memory usage: 306.4+ MB
[39]: wrong=df[df['Tons']==0]
[40]: wrong
13
... ... ... ... ... ... ...
2140687 2010-12-02 07:35:08.000 CA82 CH-02 F5SW-2900-01/MM1 CF09 0.0
2140704 2010-12-02 06:57:31.000 CA82 CH-02 F5SW-2900-01/MM1 CF09 0.0
2140743 2010-12-02 05:46:36.000 CA82 CH-02 F5SW-2900-01/MM1 CF09 0.0
2140797 2010-12-02 03:54:29.000 CA82 CH-02 F5SW-2900-01/MM1 CF09 0.0
2140818 2010-12-02 03:18:38.000 CA82 CH-02 F5SW-2900-01/MM1 CF09 0.0
[41]: df = df[df['Tons']!=0]
[43]: df.info()
<class 'pandas.core.frame.DataFrame'>
Int64Index: 2109113 entries, 0 to 2141620
Data columns (total 18 columns):
# Column Dtype
--- ------ -----
0 TimeArrived datetime64[ns]
14
1 Truck object
2 Destino object
3 Origen object
4 Shovel object
5 Tons float64
6 Distancia int64
7 TpoViaje float64
8 TpoEsperaDump float64
9 TpoDump float64
10 TipoMineral object
11 OpCAEX object
12 OpSHV object
13 Fase object
14 Banco object
15 Malla object
16 Otro object
17 velocidad float64
dtypes: datetime64[ns](1), float64(5), int64(1), object(11)
memory usage: 305.7+ MB
[44]: df=df[df['Tons']!=0]
[45]: df.shape
Camiones: 65 Origenes: 5935 Palas: 14 Tipo Mineral: 14 Opers Trucks: 456 Opers
Palas: 121 Nro Fases: 32 Nro Bancos: 110
[47]: # -- Se revisa ahora las variables numéricas que podrían aportar tendencia ---
# -- como Tons, Distancia, TpoViaje, TpoEsperaDump, TpoDump
15
# Numeric columns (plus the derived 'velocidad') kept together for the
# histograms that follow.
numericals = df.loc[:, ['Tons', 'Distancia', 'TpoViaje', 'TpoEsperaDump',
                        'TpoDump', 'velocidad']]
[48]: plt.figure(figsize=[10,8])
# Histogram of 'Tons', drawn on the figure opened just above.
n, bins, patches = plt.hist(x=numericals['Tons'], bins=40, color='#0504aa',
                            alpha=0.7, rwidth=0.85)
plt.grid(axis='y', alpha=0.75)
# Label the axis and title with the plotted column so the figure can be read
# on its own; the former generic 'Value' / 'Normal Distribution Histogram'
# text was identical on every histogram and asserted a normal shape.
plt.xlabel('Tons', fontsize=15)
plt.ylabel('Frequency', fontsize=15)  # was set twice; once is enough
plt.xticks(fontsize=15)
plt.yticks(fontsize=15)
plt.title('Distribution of Tons', fontsize=15)
plt.show()
16
[49]: plt.figure(figsize=[10,8])
# Histogram of 'Distancia', drawn on the figure opened just above.
n, bins, patches = plt.hist(x=numericals['Distancia'], bins=40, color='#0504aa',
                            alpha=0.7, rwidth=0.85)
plt.grid(axis='y', alpha=0.75)
# Label the axis and title with the plotted column so the figure can be read
# on its own; the former generic 'Value' / 'Normal Distribution Histogram'
# text was identical on every histogram and asserted a normal shape.
plt.xlabel('Distancia', fontsize=15)
plt.ylabel('Frequency', fontsize=15)  # was set twice; once is enough
plt.xticks(fontsize=15)
plt.yticks(fontsize=15)
plt.title('Distribution of Distancia', fontsize=15)
plt.show()
17
[50]: plt.figure(figsize=[10,8])
# Histogram of 'TpoViaje', drawn on the figure opened just above.
n, bins, patches = plt.hist(x=numericals['TpoViaje'], bins=40, color='#0504aa',
                            alpha=0.7, rwidth=0.85)
plt.grid(axis='y', alpha=0.75)
# Label the axis and title with the plotted column so the figure can be read
# on its own; the former generic 'Value' / 'Normal Distribution Histogram'
# text was identical on every histogram and asserted a normal shape.
plt.xlabel('TpoViaje', fontsize=15)
plt.ylabel('Frequency', fontsize=15)  # was set twice; once is enough
plt.xticks(fontsize=15)
plt.yticks(fontsize=15)
plt.title('Distribution of TpoViaje', fontsize=15)
plt.show()
18
[51]: plt.figure(figsize=[10,8])
# Histogram of 'TpoEsperaDump' (80 bins, unlike the 40 used for the other
# columns), drawn on the figure opened just above.
n, bins, patches = plt.hist(x=numericals['TpoEsperaDump'], bins=80, color='#0504aa',
                            alpha=0.7, rwidth=0.85)
plt.grid(axis='y', alpha=0.75)
# Label the axis and title with the plotted column so the figure can be read
# on its own; the former generic 'Value' / 'Normal Distribution Histogram'
# text was identical on every histogram and asserted a normal shape.
plt.xlabel('TpoEsperaDump', fontsize=15)
plt.ylabel('Frequency', fontsize=15)  # was set twice; once is enough
plt.xticks(fontsize=15)
plt.yticks(fontsize=15)
plt.title('Distribution of TpoEsperaDump', fontsize=15)
plt.show()
19
[52]: plt.figure(figsize=[10,8])
# Histogram of the derived 'velocidad' column, drawn on the figure opened
# just above.
n, bins, patches = plt.hist(x=numericals['velocidad'], bins=40, color='#0504aa',
                            alpha=0.7, rwidth=0.85)
plt.grid(axis='y', alpha=0.75)
# Label the axis and title with the plotted column so the figure can be read
# on its own; the former generic 'Value' / 'Normal Distribution Histogram'
# text was identical on every histogram and asserted a normal shape.
plt.xlabel('velocidad', fontsize=15)
plt.ylabel('Frequency', fontsize=15)  # was set twice; once is enough
plt.xticks(fontsize=15)
plt.yticks(fontsize=15)
plt.title('Distribution of velocidad', fontsize=15)
plt.show()
20
[53]: # -- Buscamos algunas distribuciones en variables categoricas y algunas␣
,→numericas (quick view)
21
plt.ylabel(yLa, fontsize=9)
plt.xlabel(xLa, fontsize=9)
plt.tick_params(labelsize=10)
plt.xticks(rotation = 90)
barchart_prep(x, ax)
plt.show()
#x=x.sort_index()
22
[56]: # --> Tonelaje alimentado por Camión
# Total 'Tons' per truck, divided by 1e3, rounded to 2 decimals, largest first.
x = (
    df.groupby('Truck')['Tons']
    .sum()
    .div(1e3)
    .round(2)
    .sort_values(ascending=False)
)
23
[57]: # --> Número de Cargas por Pala
# Number of rows (loads) recorded for each shovel; value_counts() already
# returns them ordered from most to fewest, so no index sort is applied.
x = df.loc[:, 'Shovel'].value_counts()
24
[58]: # --> Tonelaje cargado por Pala
# Total 'Tons' per shovel, divided by 1e6, rounded to 2 decimals, largest first.
x = (
    df.groupby('Shovel')['Tons']
    .sum()
    .div(1e6)
    .round(2)
    .sort_values(ascending=False)
)
25
[59]: # --> Tonelaje Alimentado segun el Tipo MIneral
# Total 'Tons' per mineral type, divided by 1e6, rounded to 2 decimals,
# largest first.
x = (
    df.groupby('TipoMineral')['Tons']
    .sum()
    .div(1e6)
    .round(2)
    .sort_values(ascending=False)
)
26
[60]: # Tonelaje alimentado desde cada fase a la fecha
# Total 'Tons' per 'Fase', divided by 1e6, rounded to 2 decimals, largest first.
x = (
    df.groupby('Fase')['Tons']
    .sum()
    .div(1e6)
    .round(2)
    .sort_values(ascending=False)
)
27
[61]: # Tonelaje alimentado desde cada Banco a la fecha
# Total 'Tons' per 'Banco', divided by 1e3, rounded to 0 decimals, largest first.
x = (
    df.groupby('Banco')['Tons']
    .sum()
    .div(1e3)
    .round(0)
    .sort_values(ascending=False)
)
28
[62]: s = df.groupby(['Shovel']).TimeArrived.agg({'min','max'})
[63]: s
[65]: s.reset_index()
29
[65]: Shovel min max nrodays
0 BH09 2017-04-28 06:19:11 2020-12-08 02:25:52 1319.837975
1 CF02 2010-12-01 20:02:54 2013-06-14 02:13:47 925.257558
2 CF08 2010-12-02 18:49:10 2017-12-12 11:04:53 2566.677581
3 CF09 2010-12-01 11:17:48 2013-10-04 11:18:22 1038.000394
4 CF10 2013-05-24 14:17:26 2020-12-22 06:28:04 2768.674051
5 CF11 2013-10-10 12:19:15 2020-12-08 22:26:22 2616.421609
6 PA01 2011-03-17 11:54:01 2018-06-28 10:10:07 2659.927847
7 PA03 2010-11-30 21:16:15 2020-04-21 02:58:22 3429.237581
8 PA04 2010-11-30 21:12:22 2020-12-21 06:42:53 3673.396192
9 PA05 2010-12-01 16:35:21 2020-12-22 06:20:01 3673.572685
10 PA06 2010-11-30 21:00:00 2013-10-27 21:57:07 1062.039664
11 PA07 2013-02-02 03:16:39 2020-12-19 21:16:25 2877.749838
12 PA10 2018-02-14 10:48:40 2020-12-22 04:06:49 1041.720937
13 PA11 2018-05-10 21:31:39 2020-12-21 18:10:47 955.860509
[66]: s.sort_values(by=['min'])
[69]: shsiop
30
PA04 2010-11-30 21:12:22 2020-12-21 06:42:53 3673.396192
PA05 2010-12-01 16:35:21 2020-12-22 06:20:01 3673.572685
PA07 2013-02-02 03:16:39 2020-12-19 21:16:25 2877.749838
PA10 2018-02-14 10:48:40 2020-12-22 04:06:49 1041.720937
PA11 2018-05-10 21:31:39 2020-12-21 18:10:47 955.860509
[70]: shnop
[71]: t = df.groupby(['Truck']).TimeArrived.agg({'min','max'})
[72]: t = t.sort_values(by=['min'])
[74]: t.reset_index()
31
21 CA56 2010-12-01 01:44:16 2020-12-22 03:59:33 3674.093947
22 CA01 2010-12-01 01:55:19 2010-12-10 05:39:18 9.155544
23 CA11 2010-12-01 02:00:42 2010-12-09 16:50:16 8.617755
24 CA08 2010-12-01 02:07:33 2010-12-22 08:11:40 21.252859
25 CA88 2010-12-01 02:15:29 2020-12-21 20:49:40 3673.773738
26 CA57 2010-12-01 02:15:44 2020-12-21 11:46:54 3673.396644
27 CA77 2010-12-01 02:31:17 2020-12-22 03:39:02 3674.047049
28 CA69 2010-12-01 03:36:37 2020-12-21 17:27:51 3673.577245
29 CA61 2010-12-01 04:21:01 2020-12-22 06:11:17 3674.076574
30 CA82 2010-12-01 07:01:44 2020-12-21 12:43:30 3673.237338
31 CA76 2010-12-01 09:01:08 2020-12-21 15:52:58 3673.285995
32 CA66 2010-12-01 11:52:39 2020-12-21 22:21:19 3673.436574
33 CA73 2010-12-01 12:58:59 2020-12-21 16:21:07 3673.140370
34 CA28 2010-12-01 13:30:34 2012-08-18 13:45:48 626.010579
35 CA84 2010-12-01 15:52:36 2020-12-21 18:01:34 3673.089560
36 CA70 2010-12-01 18:45:41 2020-12-22 05:54:04 3673.464155
37 CA30 2010-12-01 19:48:35 2014-01-12 09:51:17 1137.585208
38 CA71 2010-12-02 08:43:35 2014-09-05 20:40:26 1373.497813
39 CA55 2010-12-02 09:17:31 2020-12-21 14:23:13 3672.212292
40 CA63 2010-12-02 10:38:06 2020-12-21 15:57:07 3672.221539
41 CA60 2010-12-02 21:37:12 2020-12-21 17:24:42 3671.824653
42 CA53 2010-12-07 08:03:34 2020-12-21 19:22:04 3667.471181
43 CA78 2010-12-08 21:00:00 2020-12-21 22:30:23 3666.062766
44 CA65 2010-12-18 00:49:27 2020-12-21 18:43:38 3656.745961
45 CA87 2011-01-06 05:58:38 2020-12-19 19:20:36 3635.556921
46 CA58 2011-01-09 13:24:52 2020-12-21 17:41:15 3634.178044
47 CA90 2012-09-07 20:06:14 2020-12-22 00:21:21 3027.177164
48 CA91 2012-09-18 13:45:51 2020-12-20 22:45:26 3015.374711
49 CA92 2012-10-04 10:37:24 2020-12-21 16:24:01 3000.240706
50 CA93 2013-03-16 19:56:07 2020-12-21 19:37:07 2836.986806
51 CA94 2013-03-30 22:58:31 2020-12-22 06:07:05 2823.297616
52 CA95 2013-04-13 18:51:47 2020-12-22 05:23:18 2809.438553
53 CA96 2013-04-23 19:01:56 2020-12-19 23:44:18 2797.196088
54 CA97 2013-05-01 22:21:31 2020-12-21 12:43:53 2790.598866
55 CA98 2013-05-19 18:55:12 2020-12-21 20:48:26 2773.078634
56 CA99 2013-06-05 19:40:51 2020-12-22 00:39:38 2756.207488
57 CA100 2014-02-02 23:03:13 2020-12-22 05:21:28 2514.262674
58 CA101 2014-02-12 13:15:51 2020-12-22 03:24:19 2504.589213
59 CA102 2014-02-20 19:35:55 2020-12-22 04:02:50 2496.352025
60 CA103 2015-04-23 00:08:14 2020-12-22 06:20:01 2070.258183
61 CA105 2017-04-26 19:09:10 2020-12-22 03:11:45 1335.335127
62 CA104 2017-04-27 01:14:59 2020-12-22 02:18:24 1335.044039
63 CA107 2017-07-26 22:44:57 2020-12-22 00:37:49 1244.078380
64 CA106 2017-10-12 04:00:52 2020-12-21 18:19:53 1166.596539
32
[76]: trnop = t.query("max < '2020-01-01 00:00:00'")
[77]: trnop
[78]: trsiop
33
CA73 2010-12-01 12:58:59 2020-12-21 16:21:07 3673.140370
CA84 2010-12-01 15:52:36 2020-12-21 18:01:34 3673.089560
CA70 2010-12-01 18:45:41 2020-12-22 05:54:04 3673.464155
CA55 2010-12-02 09:17:31 2020-12-21 14:23:13 3672.212292
CA63 2010-12-02 10:38:06 2020-12-21 15:57:07 3672.221539
CA60 2010-12-02 21:37:12 2020-12-21 17:24:42 3671.824653
CA53 2010-12-07 08:03:34 2020-12-21 19:22:04 3667.471181
CA78 2010-12-08 21:00:00 2020-12-21 22:30:23 3666.062766
CA65 2010-12-18 00:49:27 2020-12-21 18:43:38 3656.745961
CA87 2011-01-06 05:58:38 2020-12-19 19:20:36 3635.556921
CA58 2011-01-09 13:24:52 2020-12-21 17:41:15 3634.178044
CA90 2012-09-07 20:06:14 2020-12-22 00:21:21 3027.177164
CA91 2012-09-18 13:45:51 2020-12-20 22:45:26 3015.374711
CA92 2012-10-04 10:37:24 2020-12-21 16:24:01 3000.240706
CA93 2013-03-16 19:56:07 2020-12-21 19:37:07 2836.986806
CA94 2013-03-30 22:58:31 2020-12-22 06:07:05 2823.297616
CA95 2013-04-13 18:51:47 2020-12-22 05:23:18 2809.438553
CA96 2013-04-23 19:01:56 2020-12-19 23:44:18 2797.196088
CA97 2013-05-01 22:21:31 2020-12-21 12:43:53 2790.598866
CA98 2013-05-19 18:55:12 2020-12-21 20:48:26 2773.078634
CA99 2013-06-05 19:40:51 2020-12-22 00:39:38 2756.207488
CA100 2014-02-02 23:03:13 2020-12-22 05:21:28 2514.262674
CA101 2014-02-12 13:15:51 2020-12-22 03:24:19 2504.589213
CA102 2014-02-20 19:35:55 2020-12-22 04:02:50 2496.352025
CA103 2015-04-23 00:08:14 2020-12-22 06:20:01 2070.258183
CA105 2017-04-26 19:09:10 2020-12-22 03:11:45 1335.335127
CA104 2017-04-27 01:14:59 2020-12-22 02:18:24 1335.044039
CA107 2017-07-26 22:44:57 2020-12-22 00:37:49 1244.078380
CA106 2017-10-12 04:00:52 2020-12-21 18:19:53 1166.596539
[79]: print("Palas INS: %d Palas OOS: %d Camiones INS: %d, Camiones OOS: %d"%(shsiop.
,→shape[0], shnop.shape[0], trsiop.shape[0], trnop.shape[0]))
[80]: # 'OpCAEX'
# First and last 'TimeArrived' per truck operator. The aggregations are passed
# as a list, not a set, so the 'min'/'max' column order is the same on every
# run (set iteration order is not stable across kernel restarts).
optr = df.groupby(['OpCAEX']).TimeArrived.agg(['min', 'max'])
# Split on the last recorded arrival: on/after 2020-01-01 vs. before it.
optrSI = optr.query("max >= '2020-01-01 00:00:00'")
optrNO = optr.query("max < '2020-01-01 00:00:00'")
[82]: optrSI
34
0001 2011-02-15 14:54:35 2020-11-22 18:34:36
0002 2020-06-07 18:09:24 2020-06-07 18:09:24
0046 2010-12-22 21:47:05 2020-12-08 23:54:46
0069 2020-07-16 03:39:24 2020-12-15 14:57:52
0070 2010-11-30 21:34:21 2020-12-04 20:31:05
... ... ...
9782 2012-01-07 01:44:05 2020-12-15 15:06:47
9795 2010-12-05 12:23:17 2020-12-21 16:32:17
9922 2017-04-13 17:33:45 2020-12-19 16:46:58
9949 2014-06-15 02:21:40 2020-12-21 06:33:56
mmsunk 2010-11-30 21:00:00 2020-12-20 21:00:00
[83]: optrNO
[84]: # 'OpSHV',
# First and last 'TimeArrived' per shovel operator. The aggregations are passed
# as a list, not a set, so the 'min'/'max' column order is the same on every
# run (set iteration order is not stable across kernel restarts).
opsh = df.groupby(['OpSHV']).TimeArrived.agg(['min', 'max'])
# Split on the last recorded arrival: on/after 2020-01-01 vs. before it.
opshSI = opsh.query("max >= '2020-01-01 00:00:00'")
opshNO = opsh.query("max < '2020-01-01 00:00:00'")
[86]: opshSI
35
0070 2012-10-08 23:09:09 2020-12-06 17:14:07
0157 2010-12-02 18:49:10 2020-12-15 06:55:41
0406 2020-01-23 00:56:37 2020-07-12 22:22:23
0467 2020-06-13 17:36:52 2020-06-13 19:37:10
0676 2010-12-09 16:53:34 2020-12-11 05:05:30
0812 2017-06-17 22:58:31 2020-11-28 23:50:59
0954 2013-07-23 19:44:24 2020-11-30 13:57:30
0964 2011-01-07 07:02:03 2020-12-15 10:04:53
1022 2010-12-01 11:17:48 2020-12-21 06:42:53
1149 2011-03-07 05:34:21 2020-11-30 22:03:52
1155 2012-10-27 10:15:05 2020-12-15 20:48:52
1180 2010-12-02 21:25:07 2020-12-22 04:06:49
1222 2016-09-16 10:16:25 2020-12-07 11:52:40
1228 2016-05-02 23:13:52 2020-12-08 07:22:54
1317 2011-12-03 00:43:44 2020-05-26 12:37:37
1375 2017-07-27 23:16:29 2020-12-12 23:20:33
1750 2010-12-23 14:42:31 2020-12-15 20:51:10
1815 2011-07-02 03:18:08 2020-12-21 16:55:54
2044 2010-12-01 09:40:19 2020-12-21 13:29:17
2550 2010-12-01 16:35:21 2020-12-21 20:52:42
2902 2010-12-02 04:22:54 2020-12-21 07:06:44
3185 2010-12-09 01:46:45 2020-12-15 15:12:07
3655 2016-02-04 18:22:21 2020-12-08 20:42:31
3673 2016-09-12 02:16:46 2020-07-27 20:50:16
3707 2019-09-18 21:38:16 2020-11-01 11:27:32
3902 2016-08-11 01:09:39 2020-02-19 02:39:04
4055 2013-12-09 07:28:04 2020-11-28 23:00:54
4091 2010-12-08 13:57:11 2020-12-15 08:39:52
4243 2010-11-30 21:34:21 2020-12-22 06:20:01
4344 2017-10-10 10:49:13 2020-11-28 19:08:59
4374 2012-12-13 17:52:13 2020-12-13 05:38:57
5001 2010-12-03 15:28:42 2020-12-21 20:48:26
5329 2010-12-03 16:58:36 2020-12-21 09:34:55
5384 2010-12-07 21:25:14 2020-12-15 13:39:03
5418 2015-09-12 04:48:40 2020-08-21 11:26:51
5469 2010-12-07 21:33:38 2020-11-22 16:38:49
5477 2011-01-12 12:49:04 2020-12-21 05:43:43
5865 2010-12-21 21:27:15 2020-12-01 16:33:55
5920 2012-05-02 01:42:07 2020-12-19 19:17:14
6423 2010-12-01 09:42:21 2020-12-21 19:44:07
6584 2011-01-03 12:10:45 2020-05-11 17:04:00
6668 2016-12-11 17:54:11 2020-12-22 06:28:04
6696 2017-06-17 20:44:32 2020-11-28 20:54:06
6733 2010-12-08 16:05:42 2020-12-15 08:37:11
6852 2012-04-20 08:39:26 2020-12-20 08:50:06
7377 2018-09-30 20:38:55 2020-12-08 01:49:23
7381 2011-02-13 10:00:30 2020-11-24 05:43:09
36
7514 2010-12-08 09:18:12 2020-03-09 08:48:07
7648 2010-12-01 09:33:31 2020-12-21 18:43:38
7948 2020-09-04 21:58:03 2020-09-06 23:18:11
8256 2016-03-09 00:53:53 2020-12-08 22:26:22
8261 2020-06-18 07:28:44 2020-08-30 14:02:04
8715 2010-12-01 21:30:09 2020-04-27 16:56:50
8882 2012-07-06 16:02:43 2020-12-15 13:56:53
8974 2011-08-12 02:01:02 2020-12-18 02:56:43
8997 2017-04-28 11:04:30 2020-12-07 20:50:47
9108 2010-12-02 16:43:03 2020-12-16 20:53:24
9579 2014-04-13 07:32:17 2020-12-15 02:43:32
9670 2013-03-25 08:03:30 2020-11-24 05:58:10
9922 2017-04-28 06:19:11 2020-12-16 13:55:10
mmsunk 2010-11-30 21:00:00 2020-12-21 21:21:29
[87]: opshNO
37
5254 2016-03-14 16:03:47 2016-03-14 16:27:24
6039 2010-12-19 09:22:10 2013-02-21 05:48:48
6310 2015-10-24 05:15:08 2017-10-24 01:19:36
6373 2010-12-01 20:02:54 2018-06-10 17:44:20
6458 2013-08-16 11:56:54 2018-08-26 08:47:59
6574 2017-11-14 09:41:18 2017-12-25 00:43:21
6586 2010-12-01 21:40:35 2018-11-25 05:51:14
6825 2010-12-25 03:18:45 2017-12-17 06:46:31
7278 2017-11-11 01:26:04 2018-11-23 20:28:25
7283 2012-05-11 00:59:14 2016-07-18 08:59:36
7451 2011-01-21 17:36:22 2019-09-07 12:39:29
7513 2016-01-16 21:27:50 2016-01-16 21:40:37
7645 2010-11-30 21:17:34 2010-12-02 08:49:15
7657 2012-12-08 01:13:44 2019-01-25 05:23:55
7945 2017-12-08 18:22:43 2017-12-24 03:30:07
8070 2011-09-15 10:27:37 2017-12-13 08:57:16
8225 2015-11-09 04:59:55 2016-05-08 16:38:19
8428 2010-12-02 21:55:18 2012-01-12 16:51:52
8542 2010-12-09 04:26:44 2017-12-29 08:56:09
8657 2010-12-07 21:45:03 2018-12-17 18:48:14
8719 2010-12-20 19:00:35 2015-09-23 05:51:33
8751 2012-11-04 20:36:36 2013-10-18 23:38:21
8880 2012-03-15 22:42:39 2012-03-16 08:57:47
8987 2011-06-29 21:55:41 2011-06-30 00:34:02
9232 2010-12-01 15:33:32 2018-04-30 06:17:39
9342 2011-01-22 02:37:22 2017-08-25 04:59:27
9378 2011-04-16 12:33:11 2016-07-05 15:43:01
9826 2010-12-09 00:14:26 2019-12-15 16:49:59
9850 2012-02-17 02:34:14 2017-11-06 20:49:08
[88]: print("Opers CAEX INS: %d Opers CAEX OOS: %d Opers SHOVEL INS: %d Opers SHOVEL␣
,→OOS: %d"%(optrSI.shape[0], optrNO.shape[0], opshSI.shape[0], opshNO.shape[0]))
Opers CAEX INS: 293 Opers CAEX OOS: 163 Opers SHOVEL INS: 64 Opers SHOVEL OOS:
57
[90]: velop
38
... ... ... ... ...
9850 2.65 21.264105 22.48 27.83
9917 2.65 21.798007 22.44 43.34
9922 13.80 20.139268 21.01 25.82
9949 10.47 20.733605 21.33 27.33
mmsunk 2.65 21.325989 22.33 47.08
[92]: idxmi
[93]: print(velop[idxmi[0]:])
[95]: idxma
[96]: print(velop[idxma[0]:])
39
3646 6.55 21.565922 23.030 32.21
3655 2.67 21.467263 22.770 27.50
... ... ... ... ...
9850 2.65 21.264105 22.480 27.83
9917 2.65 21.798007 22.440 43.34
9922 13.80 20.139268 21.010 25.82
9949 10.47 20.733605 21.330 27.33
mmsunk 2.65 21.325989 22.330 47.08
40
OP04 2016-09-21 19:35:24 2016-09-21 19:35:24 0.000000
CH_3 2016-12-16 14:21:18 2017-01-28 14:28:25 43.004942
F10E 2018-02-16 08:04:53 2018-12-31 21:32:59 318.561181
F9SE 2018-05-19 01:11:38 2020-12-21 18:10:47 947.707743
F11W 2020-02-13 21:17:45 2020-08-21 22:19:37 190.042963
41
3245 2010-11-30 21:16:15 2015-04-06 10:33:13 1587.553449
2885 2010-12-01 11:17:48 2018-05-18 03:46:39 2724.686701
3275 2010-12-01 16:35:21 2020-12-18 14:07:54 3669.897604
... ... ... ...
2772 2020-07-26 19:26:40 2020-10-09 13:23:50 74.748032
2765 2020-08-13 23:57:56 2020-11-17 06:52:28 95.287870
3150 2020-09-09 11:34:35 2020-12-09 18:59:09 91.308727
2757 2020-11-14 00:59:21 2020-12-22 06:28:04 38.228275
3210 2020-12-08 22:17:28 2020-12-13 18:12:53 4.830150
[105]: df.head(10)
42
2 2020-12-22 06:11:17 CA61 CH-02 STOC-2930-00/MM1 PA05 287.0
3 2020-12-22 06:07:05 CA94 CH-02 STOC-2930-00/MM1 PA05 269.0
4 2020-12-22 05:54:04 CA70 CH-02 STOC-2930-00/MM1 PA05 318.0
5 2020-12-22 05:49:53 CA86 CH-1 STOC-2930-00/MM1 PA05 261.0
6 2020-12-22 05:46:01 CA103 CH-02 STOC-2930-00/MM1 PA05 294.0
7 2020-12-22 05:32:54 CA83 CH-1 F7R1-2757-02/MP2 CF10 305.0
8 2020-12-22 05:29:24 CA103 CH-02 STOC-2930-00/MM1 PA05 272.0
9 2020-12-22 05:23:18 CA95 CH-02 STOC-2930-00/MM1 PA05 314.0
[107]: df
43
2141617 2010-11-30 21:06:09 CA09 CH-02 STOC-3095-02/MM1 PA06 212.0
2141618 2010-11-30 21:00:00 CA72 CH-02 STOC-3095-02/MM1 PA06 304.0
2141619 2010-11-30 21:00:00 CA29 CH-1 STOC-3095-02/MM1 PA06 303.0
2141620 2010-11-30 21:00:00 CA74 CH-1 STOC-3095-02/MM1 PA06 304.0
[109]: tviaje
44
2018 0.500000 13.896893 14.433330 244.38330
2019 0.933333 14.440410 13.916670 176.15000
2020 0.766667 16.033147 14.283330 125.40000
[111]: tfase.sort_index(inplace=True)
[112]: tfase
45
SM-A 1.883333 6.092091 5.883333 29.850000
STOC 2.766667 8.649688 5.950000 33.500000
2014 F10N 0.716667 24.766733 23.216670 83.016670
F5SW 13.550000 13.785632 13.550000 14.150000
F6NE 1.483333 9.569675 9.616667 56.116660
F7DE 0.333333 7.046135 6.766667 68.233330
F7DN 7.316667 7.810378 7.916667 8.683333
F7DW 0.783333 8.711853 8.900000 51.083330
F7NE 0.733333 5.384588 5.033333 69.316670
F7NW 8.350000 16.672223 8.350000 33.316670
F8NE 1.033333 6.064710 5.366667 54.616660
F9NW 11.100000 24.024053 24.500000 25.466670
F9PD 4.783333 4.783333 4.783333 4.783333
POLI 8.700000 9.100000 9.300000 9.300000
SM-A 1.033333 3.691833 3.516667 48.066670
STOC 0.516667 8.411961 6.966667 70.633330
2015 F10N 0.133333 25.657162 24.466670 139.516700
F6NE 1.266667 8.804618 8.733334 52.366660
F6SW 1.083333 10.169895 9.500000 73.100000
F7DE 1.000000 7.402948 6.516667 68.833340
F7DW 0.366667 8.083917 7.283333 96.983330
F7NE 2.600000 9.686597 12.133330 61.466670
F8NE 0.533333 5.845189 4.966667 89.016670
F8SE 1.083333 3.940164 3.766667 6.833333
RELL 4.283333 6.715823 6.566667 9.250000
SM-A 3.000000 3.594136 3.433333 5.633333
STOC 0.333333 7.812250 4.366667 80.983330
VENT 3.566667 3.841667 3.841667 4.116667
2016 CASE 1.116667 3.005451 3.000000 13.850000
CH_3 3.416667 3.416667 3.416667 3.416667
F10N 0.750000 22.022711 20.050000 95.100000
F7DW 1.033333 6.361630 6.166667 60.916670
F7R1 0.233333 6.216798 6.183333 74.533330
F8NE 1.050000 6.903034 6.716667 64.416660
OP04 22.016670 22.016670 22.016670 22.016670
STOC 0.733333 7.906810 6.400000 64.383330
VENT 2.966667 3.685379 3.566667 5.550000
2017 CH_3 3.416667 3.416667 3.416667 3.416667
F10N 0.583333 18.562358 17.683330 109.583300
F7R1 0.283333 8.205488 8.183333 73.200000
F8NE 6.166667 8.351394 7.933333 39.833330
STOC 0.416667 6.112060 4.266667 48.550000
2018 F10E 8.366667 16.549612 16.050000 60.233330
F10N 1.200000 16.624713 15.966670 93.750000
F7R1 1.366667 12.088320 12.166670 244.383300
F9PD 10.900000 10.900000 10.900000 10.900000
F9SE 1.950000 13.513334 13.783330 28.566670
46
STOC 0.500000 4.525952 3.916667 64.233330
2019 F10N 0.933333 13.978458 13.633330 176.150000
F7R1 2.733333 14.786083 14.600000 116.816700
F9SE 2.866667 25.697110 24.566670 110.633300
STOC 1.166667 5.108507 4.100000 82.566670
2020 F10N 1.200000 13.014895 13.500000 59.416670
F11W 10.383330 13.137500 13.816670 14.533330
F7R1 1.200000 16.658428 16.500000 80.516670
F9SE 1.200000 27.364230 27.083330 125.400000
STOC 0.766667 4.576475 3.383333 80.783330
[114]: display(tposOD)
[ ]:
47