Change Order Analysis

Overview

This skill implements machine learning-based change order analysis for construction projects. Predict change order costs, classify types, identify patterns in historical data, and streamline approval processes.

Capabilities:

Change order classification
Cost impact prediction
Schedule impact analysis
Pattern identification
Root cause analysis
Approval workflow optimization

Quick Start

from dataclasses import dataclass, field from datetime import date, datetime from typing import List, Dict, Optional from enum import Enum

class ChangeOrderType(Enum): DESIGN_CHANGE = "design_change" OWNER_REQUEST = "owner_request" FIELD_CONDITION = "field_condition" CODE_COMPLIANCE = "code_compliance" VALUE_ENGINEERING = "value_engineering" ERROR_OMISSION = "error_omission" SCOPE_CHANGE = "scope_change"

class ChangeOrderStatus(Enum): DRAFT = "draft" SUBMITTED = "submitted" UNDER_REVIEW = "under_review" APPROVED = "approved" REJECTED = "rejected" IMPLEMENTED = "implemented"

@dataclass class ChangeOrder: co_number: str title: str description: str co_type: ChangeOrderType status: ChangeOrderStatus submitted_date: date requested_by: str cost_impact: float schedule_impact_days: int affected_elements: List[str] = field(default_factory=list)

def classify_change_order(description: str) -> ChangeOrderType: """Simple rule-based classification""" description_lower = description.lower()

if any(word in description_lower for word in ['design', 'drawing', 'specification']):
    return ChangeOrderType.DESIGN_CHANGE
elif any(word in description_lower for word in ['owner', 'client', 'request']):
    return ChangeOrderType.OWNER_REQUEST
elif any(word in description_lower for word in ['site', 'field', 'condition', 'unforeseen']):
    return ChangeOrderType.FIELD_CONDITION
elif any(word in description_lower for word in ['code', 'regulation', 'compliance']):
    return ChangeOrderType.CODE_COMPLIANCE
elif any(word in description_lower for word in ['value', 'alternative', 'savings']):
    return ChangeOrderType.VALUE_ENGINEERING
elif any(word in description_lower for word in ['error', 'omission', 'mistake']):
    return ChangeOrderType.ERROR_OMISSION
else:
    return ChangeOrderType.SCOPE_CHANGE

Example

co = ChangeOrder( co_number="CO-001", title="Additional structural reinforcement", description="Site conditions revealed weaker soil requiring additional foundation reinforcement", co_type=classify_change_order("Site conditions revealed weaker soil"), status=ChangeOrderStatus.SUBMITTED, submitted_date=date.today(), requested_by="Site Engineer", cost_impact=50000, schedule_impact_days=5 ) print(f"CO Type: {co.co_type.value}")

Comprehensive Change Order System

Change Order Management

from dataclasses import dataclass, field from datetime import date, datetime, timedelta from typing import List, Dict, Optional, Tuple from enum import Enum import pandas as pd import numpy as np

class ImpactSeverity(Enum): MINOR = "minor" # < 1% cost, < 1 week schedule MODERATE = "moderate" # 1-5% cost, 1-4 weeks schedule MAJOR = "major" # 5-10% cost, 1-3 months schedule CRITICAL = "critical" # > 10% cost, > 3 months schedule

@dataclass class CostBreakdown: labor: float = 0 materials: float = 0 equipment: float = 0 subcontractor: float = 0 overhead: float = 0 profit: float = 0

@property
def total(self) -> float:
    return self.labor + self.materials + self.equipment + self.subcontractor + self.overhead + self.profit

@dataclass class ScheduleImpact: direct_days: int ripple_days: int critical_path_affected: bool affected_activities: List[str] = field(default_factory=list)

@property
def total_days(self) -> int:
    return self.direct_days + self.ripple_days

@dataclass class ChangeOrderDetail: co_id: str co_number: str title: str description: str justification: str

# Classification
co_type: ChangeOrderType
initiated_by: str  # owner, contractor, designer, etc.
responsibility: str  # who pays

# Status
status: ChangeOrderStatus
submitted_date: date
approved_date: Optional[date] = None
implemented_date: Optional[date] = None

# Impact
cost_breakdown: CostBreakdown = field(default_factory=CostBreakdown)
schedule_impact: ScheduleImpact = None
severity: ImpactSeverity = ImpactSeverity.MINOR

# Affected scope
affected_elements: List[str] = field(default_factory=list)
affected_drawings: List[str] = field(default_factory=list)
affected_specs: List[str] = field(default_factory=list)

# Supporting documents
attachments: List[str] = field(default_factory=list)
related_rfis: List[str] = field(default_factory=list)
related_cos: List[str] = field(default_factory=list)

# Approval
approvals: List[Dict] = field(default_factory=list)
comments: List[Dict] = field(default_factory=list)

class ChangeOrderManager: """Manage project change orders"""

def __init__(self, project_id: str, contract_value: float):
    self.project_id = project_id
    self.contract_value = contract_value
    self.change_orders: Dict[str, ChangeOrderDetail] = {}
    self.co_counter = 0

def create_change_order(self, title: str, description: str,
                       co_type: ChangeOrderType,
                       initiated_by: str) -> ChangeOrderDetail:
    """Create new change order"""
    self.co_counter += 1
    co_id = f"CO-{self.project_id}-{self.co_counter:04d}"

    co = ChangeOrderDetail(
        co_id=co_id,
        co_number=f"CO-{self.co_counter:04d}",
        title=title,
        description=description,
        justification="",
        co_type=co_type,
        initiated_by=initiated_by,
        responsibility="TBD",
        status=ChangeOrderStatus.DRAFT,
        submitted_date=date.today()
    )

    self.change_orders[co_id] = co
    return co

def update_cost(self, co_id: str, cost_breakdown: CostBreakdown):
    """Update change order cost"""
    co = self.change_orders.get(co_id)
    if co:
        co.cost_breakdown = cost_breakdown
        co.severity = self._calculate_severity(co)

def update_schedule_impact(self, co_id: str, impact: ScheduleImpact):
    """Update schedule impact"""
    co = self.change_orders.get(co_id)
    if co:
        co.schedule_impact = impact
        co.severity = self._calculate_severity(co)

def _calculate_severity(self, co: ChangeOrderDetail) -> ImpactSeverity:
    """Calculate change order severity"""
    cost_pct = co.cost_breakdown.total / self.contract_value * 100
    schedule_days = co.schedule_impact.total_days if co.schedule_impact else 0

    if cost_pct > 10 or schedule_days > 90:
        return ImpactSeverity.CRITICAL
    elif cost_pct > 5 or schedule_days > 30:
        return ImpactSeverity.MAJOR
    elif cost_pct > 1 or schedule_days > 7:
        return ImpactSeverity.MODERATE
    else:
        return ImpactSeverity.MINOR

def submit_for_approval(self, co_id: str):
    """Submit change order for approval"""
    co = self.change_orders.get(co_id)
    if co and co.status == ChangeOrderStatus.DRAFT:
        co.status = ChangeOrderStatus.SUBMITTED
        co.submitted_date = date.today()

def approve(self, co_id: str, approver: str, comments: str = ""):
    """Approve change order"""
    co = self.change_orders.get(co_id)
    if co:
        co.approvals.append({
            'approver': approver,
            'action': 'approved',
            'date': date.today().isoformat(),
            'comments': comments
        })
        co.status = ChangeOrderStatus.APPROVED
        co.approved_date = date.today()

def get_summary(self) -> Dict:
    """Get change order summary"""
    if not self.change_orders:
        return {'message': 'No change orders'}

    total_cost = sum(co.cost_breakdown.total for co in self.change_orders.values())
    total_schedule = sum(
        co.schedule_impact.total_days if co.schedule_impact else 0
        for co in self.change_orders.values()
    )

    by_type = {}
    by_status = {}
    by_severity = {}

    for co in self.change_orders.values():
        t = co.co_type.value
        by_type[t] = by_type.get(t, 0) + co.cost_breakdown.total

        s = co.status.value
        by_status[s] = by_status.get(s, 0) + 1

        sev = co.severity.value
        by_severity[sev] = by_severity.get(sev, 0) + 1

    return {
        'total_change_orders': len(self.change_orders),
        'total_cost_impact': total_cost,
        'cost_impact_pct': total_cost / self.contract_value * 100,
        'total_schedule_impact_days': total_schedule,
        'by_type': by_type,
        'by_status': by_status,
        'by_severity': by_severity
    }

ML Classification and Prediction

from sklearn.ensemble import RandomForestClassifier, GradientBoostingRegressor from sklearn.feature_extraction.text import TfidfVectorizer from sklearn.model_selection import train_test_split from sklearn.preprocessing import LabelEncoder import pandas as pd import numpy as np import joblib

class ChangeOrderPredictor: """ML-based change order classification and cost prediction"""

def __init__(self):
    self.type_classifier = None
    self.cost_predictor = None
    self.schedule_predictor = None
    self.vectorizer = TfidfVectorizer(max_features=500, ngram_range=(1, 2))
    self.type_encoder = LabelEncoder()
    self.is_trained = False

def train(self, historical_data: pd.DataFrame):
    """Train models on historical change order data

    Expected columns:
    - description: text description
    - co_type: change order type
    - cost_impact: cost in dollars
    - schedule_impact: days of delay
    - contract_value: original contract value
    - project_phase: phase when CO was raised
    - affected_elements_count: number of affected elements
    """
    # Prepare text features
    text_features = self.vectorizer.fit_transform(historical_data['description'])

    # Prepare numeric features
    numeric_features = historical_data[[
        'contract_value', 'affected_elements_count'
    ]].values

    # Combine features
    X = np.hstack([text_features.toarray(), numeric_features])

    # Train type classifier
    y_type = self.type_encoder.fit_transform(historical_data['co_type'])
    X_train, X_test, y_train, y_test = train_test_split(X, y_type, test_size=0.2)

    self.type_classifier = RandomForestClassifier(n_estimators=100, random_state=42)
    self.type_classifier.fit(X_train, y_train)

    type_accuracy = self.type_classifier.score(X_test, y_test)

    # Train cost predictor
    y_cost = historical_data['cost_impact'].values
    self.cost_predictor = GradientBoostingRegressor(n_estimators=100, random_state=42)
    self.cost_predictor.fit(X, y_cost)

    # Train schedule predictor
    y_schedule = historical_data['schedule_impact'].values
    self.schedule_predictor = GradientBoostingRegressor(n_estimators=100, random_state=42)
    self.schedule_predictor.fit(X, y_schedule)

    self.is_trained = True

    return {
        'type_classifier_accuracy': type_accuracy,
        'models_trained': True
    }

def predict(self, description: str, contract_value: float,
           affected_elements_count: int = 1) -> Dict:
    """Predict change order type and impacts"""
    if not self.is_trained:
        return {'error': 'Models not trained'}

    # Prepare features
    text_features = self.vectorizer.transform([description])
    numeric_features = np.array([[contract_value, affected_elements_count]])
    X = np.hstack([text_features.toarray(), numeric_features])

    # Predict type
    type_probs = self.type_classifier.predict_proba(X)[0]
    type_idx = np.argmax(type_probs)
    predicted_type = self.type_encoder.inverse_transform([type_idx])[0]

    # Predict cost
    predicted_cost = self.cost_predictor.predict(X)[0]

    # Predict schedule
    predicted_schedule = self.schedule_predictor.predict(X)[0]

    return {
        'predicted_type': predicted_type,
        'type_confidence': float(type_probs[type_idx]),
        'type_probabilities': {
            self.type_encoder.inverse_transform([i])[0]: float(p)
            for i, p in enumerate(type_probs)
        },
        'predicted_cost': float(max(0, predicted_cost)),
        'predicted_schedule_days': int(max(0, predicted_schedule)),
        'cost_as_pct_contract': float(predicted_cost / contract_value * 100)
    }

def save_models(self, path: str):
    """Save trained models"""
    joblib.dump({
        'type_classifier': self.type_classifier,
        'cost_predictor': self.cost_predictor,
        'schedule_predictor': self.schedule_predictor,
        'vectorizer': self.vectorizer,
        'type_encoder': self.type_encoder
    }, path)

def load_models(self, path: str):
    """Load trained models"""
    data = joblib.load(path)
    self.type_classifier = data['type_classifier']
    self.cost_predictor = data['cost_predictor']
    self.schedule_predictor = data['schedule_predictor']
    self.vectorizer = data['vectorizer']
    self.type_encoder = data['type_encoder']
    self.is_trained = True

Pattern Analysis

from collections import defaultdict from typing import List, Dict import pandas as pd

class ChangeOrderAnalyzer: """Analyze patterns in change orders"""

def __init__(self, change_orders: List[ChangeOrderDetail]):
    self.cos = change_orders
    self.df = self._to_dataframe()

def _to_dataframe(self) -> pd.DataFrame:
    """Convert change orders to DataFrame"""
    data = []
    for co in self.cos:
        data.append({
            'co_id': co.co_id,
            'co_type': co.co_type.value,
            'initiated_by': co.initiated_by,
            'cost': co.cost_breakdown.total,
            'schedule_days': co.schedule_impact.total_days if co.schedule_impact else 0,
            'submitted_date': co.submitted_date,
            'affected_elements': len(co.affected_elements),
            'severity': co.severity.value
        })
    return pd.DataFrame(data)

def analyze_by_type(self) -> Dict:
    """Analyze change orders by type"""
    if self.df.empty:
        return {}

    analysis = {}
    for co_type in self.df['co_type'].unique():
        type_df = self.df[self.df['co_type'] == co_type]
        analysis[co_type] = {
            'count': len(type_df),
            'total_cost': type_df['cost'].sum(),
            'avg_cost': type_df['cost'].mean(),
            'total_schedule_days': type_df['schedule_days'].sum(),
            'avg_schedule_days': type_df['schedule_days'].mean()
        }

    return analysis

def analyze_trends(self) -> Dict:
    """Analyze trends over time"""
    if self.df.empty:
        return {}

    self.df['month'] = pd.to_datetime(self.df['submitted_date']).dt.to_period('M')

    monthly = self.df.groupby('month').agg({
        'co_id': 'count',
        'cost': 'sum',
        'schedule_days': 'sum'
    }).rename(columns={'co_id': 'count'})

    return {
        'monthly_trend': monthly.to_dict(),
        'peak_month': monthly['count'].idxmax().strftime('%Y-%m'),
        'total_cost_trend': 'increasing' if monthly['cost'].is_monotonic_increasing else
                           'decreasing' if monthly['cost'].is_monotonic_decreasing else 'variable'
    }

def identify_root_causes(self) -> List[Dict]:
    """Identify common root causes"""
    if self.df.empty:
        return []

    # Analyze by initiator and type combination
    causes = self.df.groupby(['initiated_by', 'co_type']).agg({
        'co_id': 'count',
        'cost': 'sum'
    }).reset_index()

    causes = causes.sort_values('cost', ascending=False)

    return [
        {
            'initiator': row['initiated_by'],
            'type': row['co_type'],
            'frequency': row['co_id'],
            'total_cost': row['cost'],
            'recommendation': self._get_recommendation(row['initiated_by'], row['co_type'])
        }
        for _, row in causes.head(10).iterrows()
    ]

def _get_recommendation(self, initiator: str, co_type: str) -> str:
    """Generate recommendation based on pattern"""
    recommendations = {
        ('designer', 'design_change'): 'Improve design review process and BIM coordination',
        ('designer', 'error_omission'): 'Implement design quality checks and clash detection',
        ('owner', 'owner_request'): 'Define scope more clearly during planning phase',
        ('owner', 'scope_change'): 'Conduct thorough requirements gathering',
        ('contractor', 'field_condition'): 'Enhance site investigation before construction',
        ('contractor', 'value_engineering'): 'Include VE sessions earlier in project'
    }

    return recommendations.get(
        (initiator.lower(), co_type),
        'Review process and implement preventive measures'
    )

def calculate_risk_score(self) -> float:
    """Calculate overall change order risk score"""
    if self.df.empty:
        return 0

    # Factors:
    # - Frequency of COs
    # - Cost impact severity
    # - Schedule impact severity
    # - Trend direction

    co_rate = len(self.df) / 12  # COs per month (assuming 12 month project)
    avg_cost_impact = self.df['cost'].mean()
    avg_schedule_impact = self.df['schedule_days'].mean()

    # Normalize and weight
    freq_score = min(1, co_rate / 10) * 30  # Up to 30 points
    cost_score = min(1, avg_cost_impact / 50000) * 40  # Up to 40 points
    schedule_score = min(1, avg_schedule_impact / 30) * 30  # Up to 30 points

    return freq_score + cost_score + schedule_score

def generate_report(self, output_path: str) -> str:
    """Generate comprehensive analysis report"""
    with pd.ExcelWriter(output_path, engine='openpyxl') as writer:
        # Summary
        summary = pd.DataFrame([{
            'Total COs': len(self.cos),
            'Total Cost Impact': self.df['cost'].sum(),
            'Total Schedule Impact (days)': self.df['schedule_days'].sum(),
            'Risk Score': self.calculate_risk_score()
        }])
        summary.to_excel(writer, sheet_name='Summary', index=False)

        # By type
        pd.DataFrame(self.analyze_by_type()).T.to_excel(
            writer, sheet_name='By_Type'
        )

        # Root causes
        pd.DataFrame(self.identify_root_causes()).to_excel(
            writer, sheet_name='Root_Causes', index=False
        )

        # All COs
        self.df.to_excel(writer, sheet_name='All_COs', index=False)

    return output_path

Quick Reference

CO Type Typical Cause Prevention Strategy

Design Change Incomplete design BIM coordination, design reviews

Owner Request Changing requirements Clear scope definition

Field Condition Unforeseen site issues Thorough site investigation

Code Compliance Regulation changes Early code review

Value Engineering Cost savings opportunity VE workshops

Error/Omission Design mistakes QA/QC processes

Resources

AIA A201: General Conditions of the Contract
AGC ConsensusDocs: Change order management
DDC Website: https://datadrivenconstruction.io

Next Steps

See document-classification-nlp for CO document processing
See risk-assessment-ml for project risk analysis
See cost-prediction for cost estimation

change-order-analysis

Safety Notice

Copy this and send it to your AI assistant to learn

Example

Source Transparency

Related Skills

pandas-construction-analysis

data-evolution-analysis

bid-analysis-comparator

delay-analysis