Documente Academic
Documente Profesional
Documente Cultură
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
"""
"""
site_id maintenance_typ category_cd status_cd closed_time_id
Closed_date required_time_id Required_date planned_end_time_id
Planned_date wo_count wo_ontime_count wo_late_count
wo_upcoming_count
0 265 BREAKDOWN REPAIR Asset Maintenance Orders COMPLETED 20170206
00:00.0 20170207 00:00.0 20170206 00:00.0 1 1 0
0
1 265 BREAKDOWN REPAIR Asset Maintenance Orders COMPLETED 20170206
00:00.0 20170207 00:00.0 20170206 00:00.0 1 1 0
0
2 334 PREDICTIVE TASK Asset Maintenance Orders CANCELLED 20170406
00:00.0 20170413 00:00.0 20170406 00:00.0 1 0 1
0
3 334 PREDICTIVE TASK Asset Maintenance Orders COMPLETED 20170408
00:00.0 20170413 00:00.0 20170406 00:00.0 1 1 0
0
4 324 CORRECTIVE TASK Asset Maintenance Orders COMPLETED 20170408
00:00.0 20170413 00:00.0 20170408 00:00.0 1 1 0
0
"""
"""
return pd.to_datetime(clm,format='%Y%m%d')
"""
COMPLETED 8727
CLOSED 3208
CANCELLED 158
Name: status_cd, dtype: int64
"""
"""
Get the samples whose maintenance is completed,
so that we can predict the date of completion of maintenance only for completed
sites.
"""
# Keep only the rows whose status is COMPLETED. An explicit copy is taken so
# that the column assignments below write to an independent frame instead of
# a filtered slice of `data_year` (avoids pandas' SettingWithCopyWarning).
data_completed = data_year[data_year['status_cd'] == 'COMPLETED'].copy()

# Derive a day-of-year feature from each of the three date columns.
# NOTE(review): assumes these columns already hold pandas Timestamps
# (e.g. parsed with pd.to_datetime(..., format='%Y%m%d')) -- confirm upstream.
data_completed['closed_day'] = data_completed['closed_time_id'].map(
    lambda ts: ts.dayofyear)
data_completed['required_time(day)'] = data_completed['required_time_id'].map(
    lambda ts: ts.dayofyear)
data_completed['planned_time(day)'] = data_completed['planned_end_time_id'].map(
    lambda ts: ts.dayofyear)
# Exploratory checks; the results are only displayed, never stored.
# Number of distinct non-null site ids (40 according to the original note).
data_new['site_id'].nunique()
# Row count per work-order category.
data_new['category_cd'].value_counts()
"""
Asset Maintenance Orders 5161
Sanitation Work Orders 1609
Integrated Pest Management 802
Safety Task Work Orders 385
Final Product Zone Order 365
Autonomous Maintenance 147
Food Safety 130
Pest Management Work Order 5
Environmental Task Work Orders 4
Capital Work Orders 4
COR - Corrective Maintenance Work Orders 2
Name: category_cd, dtype: int64
"""
# Select the 'closed_day' column; presumably the regression target, given
# the model created on the next line -- confirm against the fitting code.
y = data_new['closed_day']

# Create the (not yet fitted) regression model.
# NOTE(review): LinearRegression is not imported in the visible part of this
# file -- presumably sklearn.linear_model.LinearRegression; confirm.
lm = LinearRegression()
"""
pred_train
array([109.07451724, 43.69171545, 54.58952948, ..., 46.84330053,
52.12862088, 57.95741627])
pred_test
array([ 73.39881804, 95.87136349, 82.24623855, ..., 90.58016066,
102.27159995, 98.12409611])
"""