Image classification with Python

# Import all required Python packages.
import os
import shutil

import numpy as np
import skimage.io as io
from sklearn.ensemble import AdaBoostClassifier
from sklearn.ensemble import ExtraTreesClassifier
from sklearn.ensemble import GradientBoostingClassifier
from sklearn.ensemble import RandomForestClassifier

# The copy of joblib vendored under sklearn.externals was deprecated in
# scikit-learn 0.21 and later removed. Prefer the standalone package and fall
# back to the vendored module only on old installations.
try:
    import joblib
except ImportError:
    from sklearn.externals import joblib

# Directory with the MODIS data.
rootdir = "C:\\Data\\Raster\\MODIS\\"
# Directory with the training data.
path_pix = "C:\\Data\\Samples\\"
# Directory where the fitted model is stored.
path_model = "C:\\Data\\Models\\"
# Directory where the classification results are written.
path_class = "C:\\Data\\Class\\"


def training():
    """Fit a Random Forest on the labelled MODIS pixels and save the model.

    Reads ``modis_stack_ndvi.tif`` from ``rootdir`` and ``samples_modis.tif``
    from ``path_pix``. Every sample pixel with a value greater than 0 is used
    as a training pixel, its value being the class label. The fitted
    classifier is dumped to ``model.pkl`` inside ``path_model``.

    Returns:
        None. The result is the model file written to disk.
    """
    # Path to the MODIS TIFF and to the corresponding pixel samples.
    raster = rootdir + "modis_stack_ndvi.tif"
    samples = path_pix + "samples_modis.tif"

    # Read the MODIS raster as a 16-bit array and the samples as an 8-bit array.
    img = np.array(io.imread(raster), dtype='int16')
    roi = np.array(io.imread(samples), dtype='int8')

    # Report the class labels present in the samples (0 is ignored).
    labels = np.unique(roi[roi > 0])
    print('The training data include {n} classes: {classes}'.format(n=labels.size, classes=labels))

    # Compose X (band values) and Y (labels) from the labelled pixels only.
    # NOTE(review): the boolean mask assumes the sample raster has the same
    # rows/columns as the MODIS stack -- confirm for your data.
    labelled = roi > 0
    X = img[labelled, :]
    Y = roi[labelled]

    # Class weights (class 1 has the weight 3, etc.).
    weights = {1: 3, 2: 2, 3: 2, 4: 2}

    # Build the Random Forest classifier. For more information:
    # http://scikit-learn.org/stable/modules/generated/sklearn.ensemble.RandomForestClassifier.html
    # max_features='sqrt' is what the former 'auto' setting meant for
    # classifiers; 'auto' is rejected by current scikit-learn releases.
    rf = RandomForestClassifier(
        class_weight=weights,
        n_estimators=100,
        criterion='gini',
        max_depth=4,
        min_samples_split=2,
        min_samples_leaf=1,
        max_features='sqrt',
        bootstrap=True,
        oob_score=True,
        n_jobs=1,
        random_state=None,
        verbose=True,
    )

    # Alternatively you may try out a Gradient Boosting classifier.
    # It is much less RAM consuming and considers weak training data:
    #
    # rf = GradientBoostingClassifier(n_estimators=300, min_samples_leaf=1,
    #                                 min_samples_split=4, max_depth=4,
    #                                 max_features='sqrt', learning_rate=0.8,
    #                                 subsample=1, random_state=None,
    #                                 warm_start=True)

    # Fit the training data.
    rf = rf.fit(X, Y)

    # Export the Random Forest / Gradient Boosting model.
    model = path_model + "model.pkl"
    joblib.dump(rf, model)


training()

def classification(n_bands=23):
    """Classify the MODIS stack with the saved model and export the result.

    Loads ``model.pkl`` from ``path_model``, predicts a class for every pixel
    of ``modis_stack_ndvi.tif`` in ``rootdir`` and writes the class map to
    ``classification.tif`` in ``path_class``. The world file (``.tfw``) of the
    input raster is copied next to the output.

    Args:
        n_bands: Number of leading bands of the stack passed to the model.
            Defaults to 23, the number of multitemporal NDVI bands in the
            stack.

    Returns:
        None. The results are the files written to ``path_class``.
    """
    # The raster path is rebuilt here: the variable of the same name inside
    # training() is local to that function and not visible from this one.
    raster = rootdir + "modis_stack_ndvi.tif"

    # World file of the original dataset.
    tfw_old = os.path.splitext(raster)[0] + ".tfw"

    # Read the data as a 16-bit array.
    img = np.array(io.imread(raster), dtype='int16')

    # Load the fitted model. joblib.load unpickles the file, so only load
    # model files you created yourself.
    clf = joblib.load(path_model + "model.pkl")

    # Flatten rows x cols into one axis. The target shape is taken from the
    # sliced array so that it stays valid when the stack holds more bands
    # than n_bands.
    # NOTE(review): the model must have been fitted on the same number of
    # bands that is passed here -- confirm against the training data.
    bands = img[:, :, :n_bands]
    img_as_array = bands.reshape(-1, bands.shape[2])

    # Predict per pixel and restore the 2-D image layout.
    class_prediction = clf.predict(img_as_array)
    class_prediction = class_prediction.reshape(img.shape[:2])

    # Export the classification.
    out_path = path_class + "classification.tif"
    io.imsave(out_path, class_prediction)

    # Assign the world file to the classified image.
    tfw_new = os.path.splitext(out_path)[0] + ".tfw"
    shutil.copy(tfw_old, tfw_new)


classification()

Successful Completion of UNIversInternational Certificate

In line with its internationalization strategy, the University of Würzburg supports administrative staff in their task of advising and supporting international students, guests, and academics. To this end, it has launched the "UNIversInternational" certificate...

The “Geolingual Studies” team visited the DLR EOC

The "Geolingual Studies" team of the University of Würzburg visited the DLR-EOC on 3 and 4 July 2025. Geolingual Studies is an innovative area of research and teaching which takes a decisively applied linguistic approach and combines methodologies from linguistics,...

Course on Object-based image analysis

Dr. Michael Wurm from the German Aerospace Center (DLR) gave a class about Object-based image analysis (OBIA) using the eCognition Software for the EAGLE students. The course gives an insight into the theoretical basis of OBIA and using different datasets and tasks...

Strengthening Ties: Earth Observation Research Cluster Meets with DLR GZS Lecturers

Yesterday, members of our Earth Observation Research Cluster had the opportunity to connect with colleagues from DLR during the annual summer gathering of the DLR Earth Observation Center (EOC). The informal setting of the DLR EOC summer party provided a great...

PhD defense by Thilo Erbertseder

Thilo Erbertseder will defend his PhD thesis "Satellite-based analysis of NO2 air pollution: from global to urban aspect" on Wednesday 23rd of July at 3pm in John-Skilton Str. 4a, seminar room 1. All interested staff, students, family and friends are cordially invited...

Upcoming PhD defense by Adomas Liepa

Our PhD student Adomas Liepa will defend his PhD "Potential of Satellite Earth Observation in seasonal monitoring of complex agricultural environments of East Africa" on Thursday 24th of July at 11am. The defense will take place at John Skilton Str. 4a, seminar room 1....

Image classification with Python

Image classification with Python

News

March 3, 2016

Successful Completion of UNIversInternational Certificate

The “Geolingual Studies” team visited the DLR EOC

Course on Object-based image analysis

Strengthening Ties: Earth Observation Research Cluster Meets with DLR GZS Lecturers

PhD defense by Thilo Erbertseder

Upcoming PhD defense by Adomas Liepa