我从iphone画廊的视频文件中计算md5总和。每次我选择相同的文件,它有不同的md5总和。我还检查数据长度(以字节为单位)并保持不变。所以我的问题是 - 为什么?以下是一些代码,其中包含了我试图制作它的许多方法。
- (void)imagePickerController:(UIImagePickerController *)picker didFinishPickingMediaWithInfo:(NSDictionary *)info
{
NSString *mediaType = [info objectForKey:UIImagePickerControllerMediaType];
if ([mediaType isEqualToString:@"public.movie"])
{
NSURL *videoURL = [info objectForKey:UIImagePickerControllerMediaURL];
videoData = [NSData dataWithContentsOfURL:videoURL];
[videoData retain];
NSLog(@"VIDEO DATA MD5: %@", [videoData md5]);
NSLog(@"VIDEO DATA LEN: %d", videoData.length);
}
[self dismissModalViewControllerAnimated:YES];
}
#import <CommonCrypto/CommonDigest.h>
@implementation NSData(MD5)
- (NSString*)MD5
{
// Create byte array of unsigned chars
unsigned char md5Buffer[CC_MD5_DIGEST_LENGTH];
// Create 16 byte MD5 hash value, store in buffer
CC_MD5(self.bytes, self.length, md5Buffer);
// Convert unsigned char buffer to NSString of hex values
NSMutableString *output = [NSMutableString stringWithCapacity:CC_MD5_DIGEST_LENGTH * 2];
for(int i = 0; i < CC_MD5_DIGEST_LENGTH; i++)
[output appendFormat:@"%02x",md5Buffer[i]];
return output;
}
@end
答案 0 :(得分:0)
我可以确认这种行为。无论选择何种散列函数,它都会发生(我尝试了 MD5、SHA1 和 SHA256)。
问题似乎是 NSData
。我从完全相同的文件创建了两个 NSData
实例,然后使用 [data1 isEqualTo:data2]
并返回 true。但是,通过 CC_SHA1
散列算法运行它们会为每个散列返回不同的散列。
要解决此问题,请删除 NSData
。而是使用较低级别的 C API 打开文件。这是 C 语言的示例。请注意“创建”约定——您负责在完成后释放返回的 char*
缓冲区。使用这种方法每次都会产生相同的哈希值。
char* _Nullable createBufferWithContentsOfFileAndReportLength(NSString* _Nonnull fileToScan, long* _Nullable length)
{
char const *pathToFile = [fileToScan cStringUsingEncoding:NSUTF8StringEncoding];
FILE *file = fopen(pathToFile, "r");
if (file == NULL) {
NSLog(@"Unable to open file: %@", fileToScan);
return NULL;
}
//
// Get the file length.
// 'fileLength' will be the number of bytes in the file. It will not include a null terminator or EOF. Some UTF8 characters require more than one byte, so we
// can't guarantee that fileLength is also the number of characters.
// NOTE: We don't use the fseek()/ftell()/rewind approach because it's not secure. See CERT FIO19-C advisory for details.
//
int fd = fileno(file);
if (fd < 0) {
NSLog(@"Unable to get a file descriptor for: %@", fileToScan);
fclose(file);
return NULL;
}
struct stat statBuffer;
if (fstat(fd, &statBuffer) == -1) {
NSLog(@"Unable to retrieve stats about this file: %@", fileToScan);
fclose(file);
return NULL;
}
long fileLength = statBuffer.st_size;
char *buffer = malloc(sizeof(char) * (fileLength + 1)); // enough memory to read the entire file, plus a spot for the null terminator
if (buffer == NULL) {
NSLog(@"Unable to allocate memory for: %@", fileToScan);
fclose(file);
return NULL;
}
fread(buffer, fileLength, sizeof(char), file);
buffer[fileLength] = '\0'; // No +1; this is zero-indexed. If fileLength is 5 characters, the 5th slot in the array needs to be the null terminator.
fclose(file);
if (length != NULL) {
*length = fileLength + 1;
}
return buffer;
}