SHA256 支持整数吗?
Does SHA256 favor integers?
在早些时候编码时,我注意到一些关于 SHA256 的东西 st运行ge,因为它似乎为散列生成的整数多于字母。起初我以为我只是在想象它,所以我做了一个快速测试来确定。令人惊讶的是,我的测试似乎证明 SHA256 在它生成的散列中偏爱整数值。我想知道这是为什么。散列索引是字母和数字之间的区别不应该完全相同吗?这是我的测试示例:
namespace TestingApp
{
static class Program
{
private static string letters = "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ1234567890";
private static char[] characters = letters.ToCharArray();
private static Random _rng = new Random();
static void Main(string[] args)
{
int totalIntegers = 0;
int totalLetters = 0;
for (int testingIntervals = 0; testingIntervals < 3000; testingIntervals++)
{
string randomString = NextString(10);
string checksum = DreamforceChecksum.GenerateSHA256(randomString);
int integerCount = checksum.Count(Char.IsDigit);
int letterCount = checksum.Count(Char.IsLetter);
Console.WriteLine("String: " + randomString);
Console.WriteLine("Checksum: " + checksum);
Console.WriteLine("Integers: " + integerCount);
Console.WriteLine("Letters: " + letterCount);
totalIntegers += integerCount;
totalLetters += letterCount;
}
Console.WriteLine("Total Integers: " + totalIntegers);
Console.WriteLine("Total Letters: " + totalLetters);
Console.Read();
}
private static string NextString(int length)
{
StringBuilder builder = new StringBuilder();
for (int i = 0; i < length; i++)
{
builder.Append(characters[_rng.Next(characters.Length)]);
}
return builder.ToString();
}
}
}
和我的 checksum/hashing class:
using System;
using System.Collections.Generic;
using System.Linq;
using System.Security.Cryptography;
using System.Text;
using System.Threading.Tasks;
namespace DreamforceFramework.Framework.Cryptography
{
public static class DreamforceChecksum
{
private static readonly SHA256Managed _shaManagedInstance = new SHA256Managed();
private static readonly StringBuilder _checksumBuilder = new StringBuilder();
public static string GenerateSHA256(string text)
{
byte[] bytes = Encoding.UTF8.GetBytes(text);
byte[] hash = _shaManagedInstance.ComputeHash(bytes);
_checksumBuilder.Clear();
for (int index = 0; index < hash.Length; index++)
{
_checksumBuilder.Append(hash[index].ToString("x2"));
}
return _checksumBuilder.ToString();
}
public static byte[] GenerateSHA256Bytes(string text)
{
byte[] bytes = Encoding.UTF8.GetBytes(text);
byte[] hash = _shaManagedInstance.ComputeHash(bytes);
_checksumBuilder.Clear();
for (int index = 0; index < hash.Length; index++)
{
_checksumBuilder.Append(hash[index].ToString("x2"));
}
return Encoding.UTF8.GetBytes(_checksumBuilder.ToString());
}
public static bool ValidateDataIntegrity(string data, string targetHashcode)
{
return GenerateSHA256(data).Equals(targetHashcode);
}
}
}
我有多次 运行 我的测试,每次似乎在散列中生成的整数多于字母。这里有 3 个测试运行:
有谁知道为什么 SHA256 似乎偏爱数字而不是字母和数字的平均分布?
假设有10个数字和6个字母可能,比例应该是10:6。这与您的结果完全一致。
输出为十六进制。 0-9 和 a-f
在早些时候编码时,我注意到一些关于 SHA256 的东西 st运行ge,因为它似乎为散列生成的整数多于字母。起初我以为我只是在想象它,所以我做了一个快速测试来确定。令人惊讶的是,我的测试似乎证明 SHA256 在它生成的散列中偏爱整数值。我想知道这是为什么。散列索引是字母和数字之间的区别不应该完全相同吗?这是我的测试示例:
namespace TestingApp
{
static class Program
{
private static string letters = "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ1234567890";
private static char[] characters = letters.ToCharArray();
private static Random _rng = new Random();
static void Main(string[] args)
{
int totalIntegers = 0;
int totalLetters = 0;
for (int testingIntervals = 0; testingIntervals < 3000; testingIntervals++)
{
string randomString = NextString(10);
string checksum = DreamforceChecksum.GenerateSHA256(randomString);
int integerCount = checksum.Count(Char.IsDigit);
int letterCount = checksum.Count(Char.IsLetter);
Console.WriteLine("String: " + randomString);
Console.WriteLine("Checksum: " + checksum);
Console.WriteLine("Integers: " + integerCount);
Console.WriteLine("Letters: " + letterCount);
totalIntegers += integerCount;
totalLetters += letterCount;
}
Console.WriteLine("Total Integers: " + totalIntegers);
Console.WriteLine("Total Letters: " + totalLetters);
Console.Read();
}
private static string NextString(int length)
{
StringBuilder builder = new StringBuilder();
for (int i = 0; i < length; i++)
{
builder.Append(characters[_rng.Next(characters.Length)]);
}
return builder.ToString();
}
}
}
和我的 checksum/hashing class:
using System;
using System.Collections.Generic;
using System.Linq;
using System.Security.Cryptography;
using System.Text;
using System.Threading.Tasks;
namespace DreamforceFramework.Framework.Cryptography
{
public static class DreamforceChecksum
{
private static readonly SHA256Managed _shaManagedInstance = new SHA256Managed();
private static readonly StringBuilder _checksumBuilder = new StringBuilder();
public static string GenerateSHA256(string text)
{
byte[] bytes = Encoding.UTF8.GetBytes(text);
byte[] hash = _shaManagedInstance.ComputeHash(bytes);
_checksumBuilder.Clear();
for (int index = 0; index < hash.Length; index++)
{
_checksumBuilder.Append(hash[index].ToString("x2"));
}
return _checksumBuilder.ToString();
}
public static byte[] GenerateSHA256Bytes(string text)
{
byte[] bytes = Encoding.UTF8.GetBytes(text);
byte[] hash = _shaManagedInstance.ComputeHash(bytes);
_checksumBuilder.Clear();
for (int index = 0; index < hash.Length; index++)
{
_checksumBuilder.Append(hash[index].ToString("x2"));
}
return Encoding.UTF8.GetBytes(_checksumBuilder.ToString());
}
public static bool ValidateDataIntegrity(string data, string targetHashcode)
{
return GenerateSHA256(data).Equals(targetHashcode);
}
}
}
我有多次 运行 我的测试,每次似乎在散列中生成的整数多于字母。这里有 3 个测试运行:
有谁知道为什么 SHA256 似乎偏爱数字而不是字母和数字的平均分布?
假设有10个数字和6个字母可能,比例应该是10:6。这与您的结果完全一致。
输出为十六进制。 0-9 和 a-f