From 3a5b32f44a95b989e39273527fc924ad3d32465e Mon Sep 17 00:00:00 2001
From: zyp
Date: Mon, 8 May 2006 12:54:40 +0000
Subject: [project @ zyp-20060508125440-a3cc6ea65de180a0]

[project @ 23]
Separated from disccat to a standalone project.
---
 Makefile         |  32 ++++++++++++++++++
 __init__.py      |  16 +++++++++
 crc32.cpp        |  51 ++++++++++++++++++++++++++++
 crc32.h          |  11 ++++++
 ed2k.cpp         |  53 +++++++++++++++++++++++++++++
 ed2k.h           |  22 ++++++++++++
 hash.cpp         | 101 ++++++++++++++++++++++++++++++++++++++++++++++++++++++++
 hash.h           |  38 +++++++++++++++++++++
 hash_wrapper.cpp |  15 +++++++++
 9 files changed, 339 insertions(+)
 create mode 100644 Makefile
 create mode 100644 __init__.py
 create mode 100644 crc32.cpp
 create mode 100644 crc32.h
 create mode 100644 ed2k.cpp
 create mode 100644 ed2k.h
 create mode 100644 hash.cpp
 create mode 100644 hash.h
 create mode 100644 hash_wrapper.cpp

diff --git a/Makefile b/Makefile
new file mode 100644
--- /dev/null
+++ b/Makefile
@@ -0,0 +1,32 @@
+# Builds _hash.so, the Boost.Python extension module this package imports.
+CC=gcc
+CFLAGS=-fPIC
+CPP=g++
+CPPFLAGS=-fPIC
+# Link through g++ so the C++ runtime is pulled in for the C++ objects.
+LD=g++
+LDFLAGS=-shared
+
+OBJECTS=hash_wrapper.o hash.o crc32.o ed2k.o
+TARGET=_hash.so
+INCLUDE=-I /usr/include/python2.4/
+# MD4, MD5 and SHA1 live in OpenSSL's libcrypto, so link it explicitly.
+LIB=-l boost_python -l ssl -l crypto
+
+.PHONY: all clean
+
+all: $(TARGET)
+
+clean:
+	-rm $(TARGET) $(OBJECTS)
+
+# Target rule
+$(TARGET): $(OBJECTS) Makefile
+	$(LD) $(LDFLAGS) -o $(TARGET) $(OBJECTS) $(LIB)
+
+# Pattern rules
+%.o: %.c Makefile
+	$(CC) $(CFLAGS) -o $@ -c $< $(INCLUDE)
+
+%.o: %.cpp Makefile
+	$(CPP) $(CPPFLAGS) -o $@ -c $< $(INCLUDE)
diff --git a/__init__.py b/__init__.py
new file mode 100644
--- /dev/null
+++ b/__init__.py
@@ -0,0 +1,16 @@
+from _hash import *
+
+def file_hash(name):
+    """Feed the file `name` to a new Hash in 32 KiB reads and return the Hash."""
+    h = Hash()
+    # Binary mode: the hashes must cover the raw bytes, untranslated.
+    f = open(name, 'rb')
+    try:
+        data = f.read(32768)
+        while data:
+            h.update(data)
+            data = f.read(32768)
+    finally:
+        # Close the file even when a read or an update raises.
+        f.close()
+    return h
diff --git a/crc32.cpp b/crc32.cpp
new file mode 100644
--- /dev/null
+++ b/crc32.cpp
@@ -0,0 +1,51 @@
+#include "crc32.h"
+
+// Lookup table, built by the first crc32() call; stays null until then.
+int* CRC32::crc_table;
+
+// Builds the 256-entry table for polynomial 0x04c11db7, most significant bit
+// first. The returned array is allocated with new[].
+int* CRC32::generate_table() {
+    int* table = new int[256];
+    for(unsigned int i = 0; i < 256; i++) {
+        // Unsigned arithmetic: shifting bits through the sign bit of a
+        // signed int is not portable.
+        unsigned int crc = i << 24;
+        for(int j = 0; j < 8; j++) {
+            if(crc & 0x80000000u) {
+                crc = (crc << 1) ^ 0x04c11db7u;
+            } else {
+                crc = crc << 1;
+            }
+        }
+        table[i] = static_cast<int>(crc);
+    }
+    return table;
+}
+
+// Returns the lowest `bits` bits of `data` in reversed bit order.
+int CRC32::reflect(int data, int bits) {
+    unsigned int in = static_cast<unsigned int>(data);
+    unsigned int out = 0;
+    for(int i = 0; i < bits; i++) {
+        out = (out << 1) | (in & 1u);
+        in >>= 1;
+    }
+    return static_cast<int>(out);
+}
+
+// Continues the running checksum `crc` (0 to start) over `length` bytes of
+// `data` and returns the updated checksum.
+int CRC32::crc32(int crc, const char* data, int length) {
+    if(!crc_table) {
+        crc_table = generate_table();
+    }
+    // Undo the reflect-and-invert applied on return to recover the register.
+    unsigned int reg = ~static_cast<unsigned int>(reflect(crc, 32));
+    for(int i = 0; i < length; i++) {
+        unsigned int in = static_cast<unsigned int>(reflect(data[i], 8));
+        unsigned int index = ((reg >> 24) ^ in) & 0xff;
+        reg = (reg << 8) ^ static_cast<unsigned int>(crc_table[index]);
+    }
+    return ~reflect(static_cast<int>(reg), 32);
+}
diff --git a/crc32.h b/crc32.h
new file mode 100644
--- /dev/null
+++ b/crc32.h
@@ -0,0 +1,11 @@
+#ifndef _CRC32_H_
+#define _CRC32_H_
+
+namespace CRC32 {
+    extern int* crc_table;
+    int* generate_table();
+    int reflect(int data, int bits);
+    int crc32(int crc, const char* data, int length);
+}
+
+#endif // _CRC32_H_
diff --git a/ed2k.cpp b/ed2k.cpp
new file mode 100644
--- /dev/null
+++ b/ed2k.cpp
@@ -0,0 +1,53 @@
+#include "ed2k.h"
+
+// Size in bytes of one chunk; each chunk is hashed with MD4 on its own.
+static const unsigned int CHUNK_SIZE = 9500 * 1024;
+
+Ed2k::Ed2k() {
+    MD4_Init(&md4_partial);
+    MD4_Init(&md4_final);
+    chunk_fill = 0;
+    multi_chunk = false;
+}
+
+// Feeds `length` bytes of `data` into the hash; non-positive lengths are
+// ignored.
+void Ed2k::update(const char* data, int length) {
+    while(length > 0) {
+        if(chunk_fill == CHUNK_SIZE) {
+            // The current chunk is full and more data follows: fold its
+            // MD4 into the outer hash and start a new chunk.
+            unsigned char digest[16];
+            MD4_Final(digest, &md4_partial);
+            MD4_Update(&md4_final, digest, 16);
+            MD4_Init(&md4_partial);
+            chunk_fill = 0;
+            multi_chunk = true;
+        }
+        unsigned int size = CHUNK_SIZE - chunk_fill;
+        if(static_cast<unsigned int>(length) < size) {
+            size = static_cast<unsigned int>(length);
+        }
+        MD4_Update(&md4_partial, data, size);
+        length -= static_cast<int>(size);
+        data += size;
+        chunk_fill += size;
+    }
+}
+
+// Finishes the hash and returns the 16-byte digest in a new[] array that the
+// caller must release with delete[].
+char* Ed2k::digest() {
+    char* digest = new char[16];
+    if(multi_chunk) {
+        // Several chunks: the result is the MD4 over all chunk digests.
+        unsigned char digest_partial[16];
+        MD4_Final(digest_partial, &md4_partial);
+        MD4_Update(&md4_final, digest_partial, 16);
+        MD4_Final(reinterpret_cast<unsigned char*>(digest), &md4_final);
+    } else {
+        // A single chunk: the result is that chunk's own MD4.
+        MD4_Final(reinterpret_cast<unsigned char*>(digest), &md4_partial);
+    }
+    return digest;
+}
diff --git a/ed2k.h b/ed2k.h
new file mode 100644
--- /dev/null
+++ b/ed2k.h
@@ -0,0 +1,22 @@
+#ifndef _ED2K_H_
+#define _ED2K_H_
+
+#include <openssl/md4.h>
+
+// Incremental hash: MD4 per 9500 KiB chunk, then MD4 over the chunk digests
+// when the input spans more than one chunk.
+class Ed2k {
+    private:
+        MD4_CTX md4_partial;   // hash of the chunk being filled
+        MD4_CTX md4_final;     // hash over the digests of completed chunks
+        // Bytes in the current chunk. Kept instead of a running total so
+        // input longer than 4 GiB cannot wrap the counter.
+        unsigned int chunk_fill;
+        bool multi_chunk;      // set once a full chunk has been folded in
+    public:
+        Ed2k();
+        void update(const char* data, int length);
+        char* digest();
+};
+
+#endif // _ED2K_H_
diff --git a/hash.cpp b/hash.cpp
new file mode 100644
--- /dev/null
+++ b/hash.cpp
@@ -0,0 +1,101 @@
+#include "hash.h"
+#include "crc32.h"
+
+#include <stdexcept>
+
+namespace Hex {
+    static const char* const digits = "0123456789abcdef";
+
+    // Hex-encodes `length` bytes of `bin`, two lowercase digits per byte.
+    std::string hex(const char* bin, int length) {
+        std::string s(length * 2, ' ');
+        for(int i = 0; i < length; i++) {
+            const unsigned char byte = static_cast<unsigned char>(bin[i]);
+            s[i*2] = digits[byte >> 4];
+            s[i*2+1] = digits[byte & 0xf];
+        }
+        return s;
+    }
+
+    // Hex-encodes `bin`, most significant digit first, zero padded to two
+    // digits per byte of int.
+    std::string hex(int bin) {
+        const int width = sizeof(int) * 2;
+        unsigned int value = static_cast<unsigned int>(bin);
+        std::string s(width, ' ');
+        for(int i = 0; i < width; i++) {
+            s[width - 1 - i] = digits[value & 0xf];
+            value >>= 4;
+        }
+        return s;
+    }
+}
+
+Hash::Hash() {
+    finished = false;
+
+    crc32_ctx = 0;
+    crc32_str = "";
+
+    ed2k_str = "";
+
+    MD5_Init(&md5_ctx);
+    md5_str = "";
+
+    SHA1_Init(&sha1_ctx);
+    sha1_str = "";
+}
+
+// Feeds `data` to all four hashes. Throws std::runtime_error once ed2k(),
+// md5() or sha1() has been called.
+void Hash::update(const std::string& data) {
+    if(finished) {
+        throw std::runtime_error("Can't update after digest.");
+    }
+    crc32_ctx = CRC32::crc32(crc32_ctx, data.c_str(), data.length());
+    ed2k_ctx.update(data.c_str(), data.length());
+    MD5_Update(&md5_ctx, data.c_str(), data.length());
+    SHA1_Update(&sha1_ctx, data.c_str(), data.length());
+}
+
+// Returns the running CRC32 value as hex; does not finish the hash.
+std::string Hash::crc32() {
+    return Hex::hex(crc32_ctx);
+}
+
+// Returns the ed2k digest as hex. The first call finishes the hash and
+// caches the string for later calls.
+std::string Hash::ed2k() {
+    if(!ed2k_str.length()) {
+        finished = true;
+        char* digest = ed2k_ctx.digest();
+        ed2k_str = Hex::hex(digest, 16);
+        // digest() allocates with new[], so release with delete[].
+        delete[] digest;
+    }
+    return ed2k_str;
+}
+
+// Returns the MD5 digest as hex. The first call finishes the hash and caches
+// the string for later calls.
+std::string Hash::md5() {
+    if(!md5_str.length()) {
+        finished = true;
+        unsigned char digest[16];
+        MD5_Final(digest, &md5_ctx);
+        md5_str = Hex::hex(reinterpret_cast<const char*>(digest), 16);
+    }
+    return md5_str;
+}
+
+// Returns the SHA1 digest as hex. The first call finishes the hash and
+// caches the string for later calls.
+std::string Hash::sha1() {
+    if(!sha1_str.length()) {
+        finished = true;
+        unsigned char digest[20];
+        SHA1_Final(digest, &sha1_ctx);
+        sha1_str = Hex::hex(reinterpret_cast<const char*>(digest), 20);
+    }
+    return sha1_str;
+}
diff --git a/hash.h b/hash.h
new file mode 100644
--- /dev/null
+++ b/hash.h
@@ -0,0 +1,38 @@
+#ifndef _HASH_H_
+#define _HASH_H_
+
+#include <string>
+
+#include "ed2k.h"
+
+#include <openssl/md4.h>
+#include <openssl/md5.h>
+#include <openssl/sha.h>
+
+// Computes the CRC32, ed2k, MD5 and SHA1 of one byte stream in one pass.
+class Hash {
+    private:
+        bool finished;
+
+        int crc32_ctx;
+        std::string crc32_str;
+
+        Ed2k ed2k_ctx;
+        std::string ed2k_str;
+
+        MD5_CTX md5_ctx;
+        std::string md5_str;
+
+        SHA_CTX sha1_ctx;
+        std::string sha1_str;
+
+    public:
+        Hash();
+        void update(const std::string& data);
+        std::string crc32();
+        std::string ed2k();
+        std::string md5();
+        std::string sha1();
+};
+
+#endif // _HASH_H_
diff --git a/hash_wrapper.cpp b/hash_wrapper.cpp
new file mode 100644
--- /dev/null
+++ b/hash_wrapper.cpp
@@ -0,0 +1,15 @@
+#include "hash.h"
+
+#include <boost/python.hpp>
+using namespace boost::python;
+
+// Exposes Hash to Python as the extension module _hash.
+BOOST_PYTHON_MODULE(_hash)
+{
+    class_<Hash>("Hash")
+        .def("update", &Hash::update)
+        .def("crc32", &Hash::crc32)
+        .def("ed2k", &Hash::ed2k)
+        .def("md5", &Hash::md5)
+        .def("sha1", &Hash::sha1);
+}
-- 
cgit v1.2.3