import tensorflow as tf
from tensorflow.keras import layers, models
from tensorflow.keras.callbacks import EarlyStopping
# Sample simplified model for document layout analysis
model = models.Sequential([
layers.Conv2D(32, (3,3), activation='relu', input_shape=(256, 256, 3)),
layers.MaxPooling2D(2,2),
layers.Dropout(0.3),
layers.Conv2D(64, (3,3), activation='relu'),
layers.MaxPooling2D(2,2),
layers.Dropout(0.3),
layers.Flatten(),
layers.Dense(128, activation='relu'),
layers.Dropout(0.4),
layers.Dense(5, activation='softmax') # 5 classes: title, paragraph, image, table, other
])
model.compile(optimizer=tf.keras.optimizers.Adam(learning_rate=0.0005),
loss='sparse_categorical_crossentropy',
metrics=['accuracy'])
# Early stopping to stop training when validation loss stops improving
early_stop = EarlyStopping(monitor='val_loss', patience=5, restore_best_weights=True)
# Assuming X_train, y_train, X_val, y_val are prepared image and label datasets
# model.fit(X_train, y_train, epochs=50, batch_size=32, validation_data=(X_val, y_val), callbacks=[early_stop])