summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--Makefile27
-rw-r--r--__init__.py11
-rw-r--r--crc32.cpp41
-rw-r--r--crc32.h11
-rw-r--r--ed2k.cpp41
-rw-r--r--ed2k.h17
-rw-r--r--hash.cpp85
-rw-r--r--hash.h37
-rw-r--r--hash_wrapper.cpp14
9 files changed, 284 insertions, 0 deletions
diff --git a/Makefile b/Makefile
new file mode 100644
index 0000000..0d897d0
--- /dev/null
+++ b/Makefile
@@ -0,0 +1,27 @@
+# Builds _hash.so, a Boost.Python extension module made from the C++ sources
+# listed in OBJECTS.
+CC=gcc
+# -fPIC: every object ends up inside a shared library.
+CFLAGS=-fPIC
+CPP=g++
+CPPFLAGS=-fPIC
+# Link with the C++ driver so the C++ runtime is pulled in for the C++ objects.
+LD=g++
+LDFLAGS=-shared
+
+OBJECTS=hash_wrapper.o hash.o crc32.o ed2k.o
+TARGET=_hash.so
+INCLUDE=-I /usr/include/python2.4/
+# The MD4/MD5/SHA1 routines used by the sources are provided by OpenSSL's
+# libcrypto, so it is linked explicitly instead of relying on libssl to drag
+# it in.
+LIB=-l boost_python -l ssl -l crypto
+
+.PHONY: all clean
+
+all: $(TARGET)
+
+clean:
+	-rm $(TARGET) $(OBJECTS)
+
+# Target rule
+$(TARGET): $(OBJECTS) Makefile
+	$(LD) $(LDFLAGS) -o $(TARGET) $(OBJECTS) $(LIB)
+
+# Pattern rules
+%.o: %.c Makefile
+	$(CC) $(CFLAGS) -o $@ -c $< $(INCLUDE)
+
+%.o: %.cpp Makefile
+	$(CPP) $(CPPFLAGS) -o $@ -c $< $(INCLUDE)
\ No newline at end of file
diff --git a/__init__.py b/__init__.py
new file mode 100644
index 0000000..0333819
--- /dev/null
+++ b/__init__.py
@@ -0,0 +1,11 @@
+from _hash import *
+
+def file_hash(name):
+ h = Hash()
+ f = open(name)
+ data = f.read(32768)
+ while data:
+ h.update(data)
+ data = f.read(32768)
+ f.close()
+ return h \ No newline at end of file
diff --git a/crc32.cpp b/crc32.cpp
new file mode 100644
index 0000000..55d6dd2
--- /dev/null
+++ b/crc32.cpp
@@ -0,0 +1,41 @@
+#include "crc32.h"
+
+// Lookup table used by CRC32::crc32(). As a namespace-scope pointer it starts
+// out null; the first crc32() call fills it in via generate_table().
+int* CRC32::crc_table;
+
+// Builds the 256-entry lookup table for the polynomial 0x04c11db7, processing
+// bits most-significant first.
+//
+// Returns a new[]-allocated array of 256 ints owned by the caller. Like the
+// rest of this file, the code assumes a 32-bit int.
+int* CRC32::generate_table() {
+    int* table = new int[256];
+    for(int i = 0; i < 256; i++) {
+        // Work in unsigned arithmetic: left-shifting a signed int into or
+        // past the sign bit is not well defined, unsigned shifts simply wrap.
+        unsigned int crc = static_cast<unsigned int>(i) << 24;
+        for(int j = 0; j < 8; j++) {
+            if(crc & 0x80000000u) {
+                crc = (crc << 1) ^ 0x04c11db7u;
+            } else {
+                crc = crc << 1;
+            }
+        }
+        // Stored as int because the table type is part of the public header.
+        table[i] = static_cast<int>(crc);
+    }
+    return table;
+}
+
+// Reverses the order of the lowest `bits` bits of `data`.
+//
+// data -- value whose low bits are mirrored (higher bits are ignored).
+// bits -- number of bits to mirror; this file calls it with 8 and 32.
+// Returns the mirrored bits, right-aligned in the result.
+int CRC32::reflect(int data, int bits) {
+    // Unsigned copies keep both shifts well defined for values that have the
+    // top bit set (negative ints, sign-extended chars).
+    unsigned int remaining = static_cast<unsigned int>(data);
+    unsigned int mirrored = 0;
+    for(int i = 0; i < bits; i++) {
+        mirrored = (mirrored << 1) | (remaining & 1u);
+        remaining >>= 1;
+    }
+    return static_cast<int>(mirrored);
+}
+
+// Feeds `length` bytes starting at `data` into a running CRC-32 checksum.
+//
+// crc    -- checksum returned by a previous call, or 0 to start a new one.
+// data   -- bytes to process.
+// length -- number of bytes at `data`; nothing is read when it is <= 0.
+// Returns the updated checksum, suitable for passing back in as `crc`.
+int CRC32::crc32(int crc, const char* data, int length) {
+    // Undo the final reflect/invert of the previous call to recover the
+    // internal register. The register is unsigned so the shifts below are
+    // well defined.
+    unsigned int state = ~static_cast<unsigned int>(reflect(crc, 32));
+    if(!crc_table) {
+        crc_table = generate_table();
+    }
+    for (int i = 0; i < length; i++) {
+        const unsigned int index =
+            ((state >> 24) ^ static_cast<unsigned int>(reflect(data[i], 8))) & 0xffu;
+        state = (state << 8) ^ static_cast<unsigned int>(crc_table[index]);
+    }
+    return ~reflect(static_cast<int>(state), 32);
+}
diff --git a/crc32.h b/crc32.h
new file mode 100644
index 0000000..646ccce
--- /dev/null
+++ b/crc32.h
@@ -0,0 +1,11 @@
+#ifndef _CRC32_H_
+#define _CRC32_H_
+
+// Table-driven CRC-32 helpers; the definitions live in crc32.cpp.
+namespace CRC32 {
+ // Lookup table used by crc32(); allocated on the first crc32() call.
+ extern int* crc_table;
+ // Allocates and returns a new 256-entry table for polynomial 0x04c11db7.
+ int* generate_table();
+ // Returns the lowest `bits` bits of `data` in reversed bit order.
+ int reflect(int data, int bits);
+ // Feeds `length` bytes at `data` into the running checksum `crc` (0 to
+ // start a new checksum) and returns the updated checksum.
+ int crc32(int crc, const char* data, int length);
+}
+
+#endif // _CRC32_H_
diff --git a/ed2k.cpp b/ed2k.cpp
new file mode 100644
index 0000000..92e7b15
--- /dev/null
+++ b/ed2k.cpp
@@ -0,0 +1,41 @@
+#include "ed2k.h"
+
+// Returns the smaller of the two arguments; `a` is returned when `a` is not
+// greater than `b`.
+template<class T>
+inline T min(T a, T b) {
+    if(a > b) {
+        return b;
+    }
+    return a;
+}
+
+// Starts an empty hash: no bytes consumed yet and both MD4 contexts
+// initialised.
+Ed2k::Ed2k() : size_total(0) {
+    MD4_Init(&md4_final);
+    MD4_Init(&md4_partial);
+}
+
+// Feeds `length` bytes at `data` into the hash.
+//
+// Input is split into chunks of 9500 KiB. Each chunk is hashed with MD4 in
+// md4_partial; when data arrives after a chunk has been filled, that chunk's
+// digest is appended to md4_final and md4_partial is restarted.
+//
+// data   -- bytes to hash.
+// length -- number of bytes at `data`; values <= 0 are ignored.
+void Ed2k::update(const char* data, int length) {
+    const int chunk_size = 9500 * 1024;
+    // "> 0" rather than "!= 0": a negative length must not loop forever or
+    // reach MD4_Update as a huge size.
+    while(length > 0) {
+        // Bytes already in the current chunk; always below chunk_size.
+        const int chunk_fill = static_cast<int>(size_total % chunk_size);
+        if(chunk_fill == 0 && size_total) {
+            // The previous chunk is complete and more data follows: fold its
+            // digest into the outer hash and start a new chunk.
+            unsigned char digest[16];
+            MD4_Final(digest, &md4_partial);
+            MD4_Update(&md4_final, digest, 16);
+            MD4_Init(&md4_partial);
+        }
+        // Never hash across a chunk boundary in one step.
+        int size = min<int>(length, chunk_size - chunk_fill);
+        MD4_Update(&md4_partial, data, size);
+        length -= size;
+        data += size;
+        size_total += size;
+    }
+}
+
+// Finishes the hash and returns the 16 raw digest bytes.
+//
+// When no more than one chunk (9500 KiB) was consumed, the result is the MD4
+// of that data. Otherwise the digest of the last chunk is appended to
+// md4_final and the result is the MD4 over all chunk digests.
+//
+// Returns a buffer allocated with new char[16]; the caller must release it
+// with delete[]. The MD4 contexts are finalised by this call.
+char* Ed2k::digest() {
+    char* result = new char[16];
+    unsigned char* out = reinterpret_cast<unsigned char*>(result);
+
+    const bool single_chunk = !(size_total > (9500 * 1024));
+    if(single_chunk) {
+        MD4_Final(out, &md4_partial);
+        return result;
+    }
+
+    unsigned char last_chunk[16];
+    MD4_Final(last_chunk, &md4_partial);
+    MD4_Update(&md4_final, last_chunk, 16);
+    MD4_Final(out, &md4_final);
+    return result;
+}
diff --git a/ed2k.h b/ed2k.h
new file mode 100644
index 0000000..1be7302
--- /dev/null
+++ b/ed2k.h
@@ -0,0 +1,17 @@
+#ifndef _ED2K_H_
+#define _ED2K_H_
+
+#include <openssl/md4.h>
+
+// Incremental ed2k-style hash: the input is hashed with MD4 in chunks of
+// 9500 KiB, and inputs longer than one chunk yield the MD4 of the
+// concatenated chunk digests.
+class Ed2k {
+    private:
+        // MD4 state of the chunk currently being filled.
+        MD4_CTX md4_partial;
+        // MD4 state over the digests of the chunks completed so far.
+        MD4_CTX md4_final;
+        // Total number of bytes consumed. Kept 64 bits wide: a 32-bit counter
+        // wraps at 4 GiB, which is not a multiple of the chunk size, so every
+        // chunk boundary after the wrap would be misplaced.
+        unsigned long long size_total;
+    public:
+        Ed2k();
+        // Feeds `length` bytes at `data` into the hash.
+        void update(const char* data, int length);
+        // Finishes the hash; returns a new[]-allocated 16-byte buffer that
+        // the caller must free with delete[].
+        char* digest();
+};
+
+#endif // _ED2K_H_
diff --git a/hash.cpp b/hash.cpp
new file mode 100644
index 0000000..d844c46
--- /dev/null
+++ b/hash.cpp
@@ -0,0 +1,85 @@
+#include "hash.h"
+#include "crc32.h"
+
+#include <stdexcept>
+
+// Helpers that render binary data as lowercase hexadecimal text.
+namespace Hex {
+    // Points at a string literal, so both pointer and characters are const.
+    static const char* const digits = "0123456789abcdef";
+
+    // Returns 2 * length hex characters for the `length` bytes at `bin`,
+    // high nibble first.
+    std::string hex(const char* bin, int length) {
+        std::string s(length * 2, ' ');
+        for(int i = 0; i < length; i++) {
+            // Go through unsigned char so bytes >= 0x80 are not sign-extended
+            // before shifting.
+            const unsigned char byte = static_cast<unsigned char>(bin[i]);
+            s[i*2] = digits[(byte >> 4) & 0xf];
+            s[i*2+1] = digits[byte & 0xf];
+        }
+        return s;
+    }
+
+    // Returns `bin` as a zero-padded hex string of 2 * sizeof(int)
+    // characters, most significant nibble first.
+    std::string hex(int bin) {
+        const int width = static_cast<int>(sizeof(int) * 2);
+        // Shift an unsigned copy; right-shifting a negative int is
+        // implementation-defined.
+        unsigned int value = static_cast<unsigned int>(bin);
+        std::string s(width, ' ');
+        for(int i = 0; i < width; i++) {
+            s[width - 1 - i] = digits[value & 0xf];
+            value >>= 4;
+        }
+        return s;
+    }
+}
+
+// Starts a fresh multi-hash: CRC-32 state 0, MD5 and SHA-1 contexts
+// initialised, and no cached digest strings (the std::string members are
+// default-constructed empty).
+Hash::Hash() : finished(false), crc32_ctx(0) {
+    MD5_Init(&md5_ctx);
+    SHA1_Init(&sha1_ctx);
+}
+
+// Feeds the bytes of `data` into all four hashes (CRC-32, ed2k, MD5, SHA-1).
+//
+// Throws std::runtime_error once ed2k(), md5() or sha1() has been called,
+// because those calls mark the object as finished.
+void Hash::update(std::string data) {
+    if(finished) {
+        throw std::runtime_error("Can't update after digest.");
+    }
+
+    const char* bytes = data.c_str();
+    const std::string::size_type count = data.length();
+
+    crc32_ctx = CRC32::crc32(crc32_ctx, bytes, count);
+    ed2k_ctx.update(bytes, count);
+    MD5_Update(&md5_ctx, bytes, count);
+    SHA1_Update(&sha1_ctx, bytes, count);
+}
+
+// Returns the CRC-32 of the data fed so far as a hex string. Unlike the other
+// digest getters this does not mark the object as finished.
+std::string Hash::crc32() {
+    const std::string text = Hex::hex(crc32_ctx);
+    return text;
+}
+
+// Returns the ed2k digest as 32 hex characters.
+//
+// The first call finalises the ed2k state, caches the text and marks the
+// object as finished (update() throws afterwards); later calls return the
+// cached text.
+std::string Hash::ed2k() {
+    if(ed2k_str.empty()) {
+        finished = true;
+        char* digest = ed2k_ctx.digest();
+        ed2k_str = Hex::hex(digest, 16);
+        // The buffer comes from new char[16], so it must be released with
+        // the array form of delete.
+        delete[] digest;
+    }
+    return ed2k_str;
+}
+
+// Returns the MD5 digest as 32 hex characters.
+//
+// The first call finalises the MD5 context, caches the text and marks the
+// object as finished (update() throws afterwards); later calls return the
+// cached text.
+std::string Hash::md5() {
+    if(md5_str.empty()) {
+        finished = true;
+        // A stack buffer replaces the former new char[16], which was released
+        // with the non-array delete.
+        unsigned char digest[16];
+        MD5_Final(digest, &md5_ctx);
+        md5_str = Hex::hex(reinterpret_cast<char*>(digest), 16);
+    }
+    return md5_str;
+}
+
+// Returns the SHA-1 digest as 40 hex characters.
+//
+// The first call finalises the SHA-1 context, caches the text and marks the
+// object as finished (update() throws afterwards); later calls return the
+// cached text.
+std::string Hash::sha1() {
+    if(sha1_str.empty()) {
+        finished = true;
+        // A stack buffer replaces the former new char[20], which was released
+        // with the non-array delete.
+        unsigned char digest[20];
+        SHA1_Final(digest, &sha1_ctx);
+        sha1_str = Hex::hex(reinterpret_cast<char*>(digest), 20);
+    }
+    return sha1_str;
+}
diff --git a/hash.h b/hash.h
new file mode 100644
index 0000000..3c7b9c9
--- /dev/null
+++ b/hash.h
@@ -0,0 +1,37 @@
+#ifndef _HASH_H_
+#define _HASH_H_
+
+#include <string>
+
+#include "ed2k.h"
+
+#include <openssl/md4.h>
+#include <openssl/md5.h>
+#include <openssl/sha.h>
+
+// Computes CRC-32, ed2k, MD5 and SHA-1 over the same stream of data.
+// Feed data with update(), then read the results as hex strings.
+class Hash {
+ private:
+ // Set by ed2k(), md5() and sha1(); update() throws once it is true.
+ bool finished;
+
+ // Running CRC-32 value, starts at 0.
+ int crc32_ctx;
+ // NOTE(review): not referenced by the hash.cpp code shown with this header.
+ std::string crc32_str;
+
+ // ed2k state and its cached hex digest (empty until ed2k() is called).
+ Ed2k ed2k_ctx;
+ std::string ed2k_str;
+
+ // MD5 state and its cached hex digest (empty until md5() is called).
+ MD5_CTX md5_ctx;
+ std::string md5_str;
+
+ // SHA-1 state and its cached hex digest (empty until sha1() is called).
+ SHA_CTX sha1_ctx;
+ std::string sha1_str;
+
+ public:
+ Hash();
+ // Feeds `data` into all hashes; throws std::runtime_error after a digest
+ // other than crc32() has been requested.
+ void update(std::string data);
+ // Hex string of the CRC-32 of the data fed so far.
+ std::string crc32();
+ // Hex digests; the first call to any of these three finishes the object.
+ std::string ed2k();
+ std::string md5();
+ std::string sha1();
+};
+
+#endif // _HASH_H_
diff --git a/hash_wrapper.cpp b/hash_wrapper.cpp
new file mode 100644
index 0000000..a4173b9
--- /dev/null
+++ b/hash_wrapper.cpp
@@ -0,0 +1,14 @@
+#include "hash.h"
+
+#include <boost/python.hpp>
+using namespace boost::python;
+
+// Defines the Python extension module `_hash`, exposing the C++ Hash class
+// as `Hash` with its update/crc32/ed2k/md5/sha1 methods.
+BOOST_PYTHON_MODULE(_hash)
+{
+    class_<Hash> hash_class("Hash");
+    hash_class.def("update", &Hash::update);
+    hash_class.def("crc32", &Hash::crc32);
+    hash_class.def("ed2k", &Hash::ed2k);
+    hash_class.def("md5", &Hash::md5);
+    hash_class.def("sha1", &Hash::sha1);
+}