python图像处理之sift-kmeans-SVM图像分类

网上有很多资料，参考：https://blog.csdn.net/u012874151/article/details/45457085/

原文代码在 Python 3 或较新版本的 OpenCV 下无法直接运行。

我这里做一些改动，自行参考，文笔有限。

改动点1：图像输入自定义，不再固定名称

改动点2：解决找不到sift、svm组件类型问题

改动点3：解决svm训练的标签错误问题

改动点4：解决导入不了svm模型问题

等

注意：传给 svm.train 的标签（response）必须是整数类型（例如 np.int32）。

浮点数型数据不能强行转换成整数型，会导致数据错误，参考：https://blog.csdn.net/smileyuping/article/details/22100743

代码如下：

import cv2
import numpy as np
import os

# Training-set classes mapped to the number of images declared for each class.
# Key order matters: trainClassifier() and classify() derive the numeric class
# label from the position of each key while iterating, so TestSetInfo must list
# the same classes in the same order.
TrainSetInfo = {
    "car": 40,
    "city": 20,
    "dog": 30,
    "earth": 15,
    "fireworks": 20,
    "flowers": 20,
    "fruits": 20,
    "glass": 20,
    "gold": 15,
    "gun": 20,
    "plane": 40,
    "sky": 30,
    "worldcup": 40,
}

# Test-set classes mapped to the number of images declared for each class.
# Key order matters: classify() compares the predicted label with the position
# of each key here, so the order must match the one used for training
# (TrainSetInfo).
TestSetInfo = {
    "car": 119,
    "city": 59,
    "dog": 49,
    "earth": 24,
    "fireworks": 54,
    "flowers": 63,
    "fruits": 78,
    "glass": 52,
    "gold": 44,
    "gun": 44,
    "plane": 102,
    "sky": 78,
    "worldcup": 131,
}

def calcSiftFeature(img):
    """Compute SIFT descriptors for one BGR image.

    Args:
        img: Image array in BGR channel order, e.g. the result of
            ``cv2.imread``. Must not be None.

    Returns:
        The descriptor array produced by ``detectAndCompute`` (one descriptor
        per row). If no keypoint is detected, an empty float32 array of shape
        ``(0, 128)`` is returned instead of None, so callers can stack or
        iterate over the result without special-casing.
    """
    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)

    # SIFT lives in the main module since OpenCV 4.4; older builds only expose
    # it through the contrib module ``xfeatures2d``.
    if hasattr(cv2, "SIFT_create"):
        sift = cv2.SIFT_create(200)  # keep at most 200 SIFT points
    else:
        sift = cv2.xfeatures2d.SIFT_create(200)

    kp, des = sift.detectAndCompute(gray, None)
    if des is None:
        # detectAndCompute yields None when the image has no keypoints.
        return np.float32([]).reshape(0, 128)
    return des

def calcFeatVec(features, centers):
    """Build a bag-of-visual-words histogram for one image.

    Each descriptor is assigned to its nearest cluster center (Euclidean
    distance) and the assignments are counted per center.

    Args:
        features: 2-D array with one descriptor per row. ``None`` or an empty
            array yields an all-zero histogram.
        centers: 2-D array with one cluster center per row; its row count
            defines the histogram length.

    Returns:
        A float64 array of shape ``(1, K)`` where ``K = centers.shape[0]`` and
        element ``[0][j]`` is the number of descriptors closest to center ``j``.
    """
    centers = np.asarray(centers)
    wordCnt = centers.shape[0]
    featVec = np.zeros((1, wordCnt))
    if features is None or len(features) == 0:
        return featVec

    features = np.asarray(features)
    # Pairwise differences, shape (num_features, wordCnt, dim). The square root
    # is skipped because it does not change which center is nearest.
    diff = features[:, np.newaxis, :] - centers[np.newaxis, :, :]
    sqDist = (diff ** 2).sum(axis=2)
    nearest = sqDist.argmin(axis=1)  # index of the nearest center per feature
    featVec[0] = np.bincount(nearest, minlength=wordCnt)
    return featVec

def initFeatureSet():
    """Extract SIFT descriptors for every training class and cache them on disk.

    For each class name in ``TrainSetInfo``, every file found in
    ``TrainSet/<name>/`` is read, its descriptors are computed with
    ``calcSiftFeature`` and all descriptors of the class are stacked and saved
    to ``Temp1/features/<name>.npy``. Files that OpenCV cannot decode are
    skipped; images without any descriptor contribute no rows.
    """
    outDir = "Temp1/features/"
    os.makedirs(outDir, exist_ok=True)  # np.save does not create directories

    for name in TrainSetInfo:
        imgDir = "TrainSet/" + name + "/"
        print("Extract features from training set " + name + "...")

        # Seed with an empty (0, 128) block so the concatenation below also
        # works when no image yields descriptors.
        descriptors = [np.float32([]).reshape(0, 128)]
        imgCnt = 0
        for entry in sorted(os.listdir(imgDir)):
            img = cv2.imread(os.path.join(imgDir, entry))
            if img is None:
                # imread returns None for files it cannot decode.
                print("Skip unreadable file " + entry)
                continue
            imgCnt += 1
            des = calcSiftFeature(img)
            if des is not None and len(des) > 0:
                descriptors.append(des)

        # Concatenate once instead of re-allocating the array per image.
        featureSet = np.concatenate(descriptors, axis=0)
        featCnt = featureSet.shape[0]
        print(str(featCnt) + " features in " + str(imgCnt) + " images\n")

        # save featureSet to file
        np.save(outDir + name + ".npy", featureSet)

def learnVocabulary():
    """Cluster each class's cached descriptors into a 50-word vocabulary.

    For each class name in ``TrainSetInfo`` the descriptors stored in
    ``Temp1/features/<name>.npy`` are clustered with ``cv2.kmeans`` and the
    resulting ``(labels, centers)`` pair is saved to
    ``Temp1/vocabulary/<name>.npy`` as a two-element object array.
    """
    wordCnt = 50
    outDir = "Temp1/vocabulary/"
    os.makedirs(outDir, exist_ok=True)  # np.save does not create directories

    # Stop after 20 iterations or once the centers move by less than 0.1.
    criteria = (cv2.TERM_CRITERIA_EPS + cv2.TERM_CRITERIA_MAX_ITER, 20, 0.1)
    flags = cv2.KMEANS_RANDOM_CENTERS

    for name in TrainSetInfo:
        features = np.load("Temp1/features/" + name + ".npy")

        print("Learn vocabulary of " + name + "...")
        # use k-means to cluster a bag of features (20 attempts, best one kept)
        compactness, labels, centers = cv2.kmeans(
            features, wordCnt, None, criteria, 20, flags
        )

        # labels and centers have different shapes; recent NumPy refuses to
        # build an array from such a ragged tuple implicitly, so the object
        # array is created explicitly. Readers still unpack it as
        # ``labels, centers = np.load(...)``.
        vocabulary = np.empty(2, dtype=object)
        vocabulary[0] = labels
        vocabulary[1] = centers
        np.save(outDir + name + ".npy", vocabulary)
        print("Done\n")

def trainClassifier():
    """Train a linear SVM on bag-of-words histograms and save it to ``svm.clf``.

    For each class name in ``TrainSetInfo`` (its position in the dict is the
    numeric class label) every readable image in ``TrainSet/<name>/`` is turned
    into a histogram with ``calcFeatVec`` using that class's vocabulary from
    ``Temp1/vocabulary/<name>.npy``. One label is recorded per histogram, so
    samples and labels always line up even if the directory content differs
    from the counts declared in ``TrainSetInfo``.

    Raises:
        ValueError: if no usable training image was found.
    """
    # NOTE(review): every class is encoded against its own vocabulary, so
    # histogram bin j refers to a different visual word in each class -
    # confirm this is intended rather than one shared vocabulary.
    samples = []
    sampleLabels = []

    for dictIdx, name in enumerate(TrainSetInfo):
        imgDir = "TrainSet/" + name + "/"
        # The vocabulary file is an object array and therefore pickled; it is
        # produced by this pipeline itself. Do not point this at untrusted files.
        labels, centers = np.load(
            "Temp1/vocabulary/" + name + ".npy", allow_pickle=True
        )

        print("Init training data of " + name + "...")
        for entry in os.listdir(imgDir):
            img = cv2.imread(os.path.join(imgDir, entry))
            if img is None:
                continue  # not a decodable image
            features = calcSiftFeature(img)
            if features is None or len(features) == 0:
                continue  # no descriptors, nothing to learn from
            samples.append(calcFeatVec(features, centers))
            sampleLabels.append(dictIdx)
        print("Done\n")

    if not samples:
        raise ValueError("no usable training images found under TrainSet/")

    print("Now train svm classifier...")
    trainData = np.float32(np.concatenate(samples, axis=0))
    # SVM class labels must be an integer array (one row per sample).
    response = np.int32(sampleLabels).reshape(-1, 1)
    svm = cv2.ml.SVM_create()
    svm.setKernel(cv2.ml.SVM_LINEAR)
    svm.train(trainData, cv2.ml.ROW_SAMPLE, response)
    svm.save("svm.clf")
    print("Done\n")
	
def classify():
    """Evaluate the saved SVM (``svm.clf``) on the test set and print accuracy.

    For each class name in ``TestSetInfo`` (its position in the dict is the
    expected label) every readable image in ``TestSet/<name>/`` is converted to
    a histogram and classified. Accuracy is reported per class and in total,
    using the number of images actually tested as the denominator. An image
    without any descriptor counts as tested but not correct.
    """
    # NOTE(review): the vocabulary is selected by the image's true class name,
    # i.e. the ground truth is used while building the feature vector - confirm
    # this is acceptable for the intended evaluation.
    svm = cv2.ml.SVM_load("svm.clf")

    total = 0
    correct = 0
    for dictIdx, name in enumerate(TestSetInfo):
        crt = 0
        tested = 0
        imgDir = "TestSet/" + name + "/"
        # The vocabulary file is an object array and therefore pickled; it is
        # produced by this pipeline itself. Do not point this at untrusted files.
        labels, centers = np.load(
            "Temp1/vocabulary/" + name + ".npy", allow_pickle=True
        )

        print("Classify on TestSet " + name + ":")
        for entry in os.listdir(imgDir):
            img = cv2.imread(os.path.join(imgDir, entry))
            if img is None:
                continue  # not a decodable image
            tested += 1
            features = calcSiftFeature(img)
            if features is None or len(features) == 0:
                continue  # nothing to classify on; counted as a miss
            case = np.float32(calcFeatVec(features, centers))
            # predict returns (retval, results); results holds one row per sample
            _, results = svm.predict(case)
            if int(results[0][0]) == dictIdx:
                crt += 1

        print("Accuracy: " + str(crt) + " / " + str(tested) + "\n")
        total += tested
        correct += crt

    print("Total accuracy: " + str(correct) + " / " + str(total))

if __name__ == "__main__":
    # Run the pipeline in dependency order: each step reads the files written
    # by the previous one (features -> vocabulary -> svm.clf -> evaluation).
    initFeatureSet()
    learnVocabulary()
    trainClassifier()
    classify()

如有疑问，请评论。

继续阅读与本文标签相同的文章

无标签

2019“光谷高科技高成长20强”及“光谷明日之星”榜单揭晓

常见数据库的数据分页语法

收藏打印

python图像处理之sift-kmeans-SVM图像分类

浏览：459 2026-05-06

继续阅读与本文标签相同的文章

2019“光谷高科技高成长20强”及“光谷明日之星”榜单揭晓

常见数据库的数据分页语法

特别推荐 2026年05月18日星期一

精彩发现

热门标签

python图像处理之sift-kmeans-SVM图像分类

浏览：459 2026-05-06

继续阅读与本文标签相同的文章

2026-05-18栏目： 教程

2026-05-18栏目： 教程

2026-05-18栏目： 教程

2026-05-18栏目： 教程

2026-05-18栏目： 教程

2026-04-23栏目： 教程

2026-04-23栏目： 教程

2026-04-23栏目： 教程

2026-04-23栏目： 教程

2026-04-24栏目： 教程

特别推荐 2026年05月18日 星期一

精彩发现

热门标签

相关文章

2026-05-18栏目：教程

2026-05-18栏目：教程

2026-05-18栏目：教程

2026-05-18栏目：教程

2026-05-18栏目：教程

2026-04-23栏目：教程

2026-04-23栏目：教程

2026-04-23栏目：教程

2026-04-23栏目：教程

2026-04-24栏目：教程

特别推荐 2026年05月18日星期一