/****************************  omfhash.cpp  **********************************
* Author:        Agner Fog
* Date created:  2007-02-14
* Last modified: 2007-02-14
* Project:       objconv
* Module:        omfhash.cpp
* Description:
* This module contains code for searching and making hash tables for OMF
* libraries.
*
* Copyright 2007-2008 GNU General Public License http://www.gnu.org/licenses
*****************************************************************************/

#include "stdafx.h"

void COMFHashTable::Init(SOMFHashBlock * blocks, uint32 NumBlocks) {
   // Initialize
   this->blocks = blocks;                        // Pointer to blocks
   this->NumBlocks = NumBlocks;                  // Number of blocks
   String = 0;
   StringLength = 0;
}

// Rotate right 16-bit word
uint16 RotR(uint16 x, uint16 bits) {
   return (x >> bits) | (x << (16 - bits));
}

// Rotate left 16-bit word
uint16 RotL(uint16 x, uint16 bits) {
   return (x << bits) | (x >> (16 - bits));
}

void COMFHashTable::MakeHash(int8 * name) {
   // Compute hash according to the official algorithm
   uint8 * pb;                                   // Pointer for forward scan through string
   uint8 * pe;                                   // Pointer for backwards scan through string
   uint16 c;                                     // Current character converted to lower case
   uint16 BlockX;                                // Calculate block hash
   uint16 BucketX;                               // Calculate block hash
   String = (uint8*)name;                        // Type cast string to unsigned char *
   StringLength = (uint32)strlen(name);
   if (StringLength > 255) {
      // String too long
      err.submit(1204, name);                    // Warning: truncating
      StringLength = 255;
      String[StringLength] = 0;                  // Truncation modifies string source!
   }
   String = (uint8*)name;                        // Type cast to unsigned characters
   pb = String;                                  // Initialize pointer for forward scan
   pe = String + StringLength;                   // Initialize pointer for backward scan
   BlockX = BucketD = StringLength | 0x20;       // Initialize left-to-right scan
   BucketX = BlockD = 0;                         // Initialize right-to-left scan

   // Scan loop
   while (1) {
      c = *(--pe) | 0x20;                        // Read character for backward scan, make lower case
      BucketX = RotR(BucketX, 2) ^ c;            // Rotate, XOR
      BlockD  = RotL(BlockD,  2) ^ c;            // Rotate, XOR
      if (pe == String) break;                   // Stop loop when backward scan finished
      c = *(pb++) | 0x20;                        // Read character for forward scan, make lower case
      BlockX  = RotL(BlockX,  2) ^ c;            // Rotate, XOR
      BucketD = RotR(BucketD, 2) ^ c;            // Rotate, XOR
   }
   // Make values modulo number of blocks / buckets
   BlockX = BlockX % NumBlocks;
   BlockD = BlockD % NumBlocks;
   if (BlockD == 0) BlockD = 1;
   BucketX = BucketX % OMFNumBuckets;
   BucketD = BucketD % OMFNumBuckets;
   if (BucketD == 0) BucketD = 1;
   StartBlock  = BlockX;
   StartBucket = BucketX;
}


int  COMFHashTable::FindString(uint32 & ModulePage, uint32 & Conflicts) {
   // Search for String. 
   // Returns number of occurrences of String
   // Module receives the module page for the first occurrence
   // Conflicts receives the number of conflicting entries encountered before the match
   uint32 Num = 0;                               // Number of occurrences of string found
   uint16 Block;                                 // Block number
   uint16 Bucket;                                // Bucket number
   uint32 StringIndex;                           // Index to string
   Conflicts = 0;                                // Start counting Conflicts

   Block = StartBlock;
   Bucket = StartBucket;

   // Loop through blocks
   do {

      // Loop through buckets
      do {

         // String index of current bucket
         StringIndex = blocks[Block].b.Buckets[Bucket];
         if (StringIndex == 0) {
            if (blocks[Block].b.FreeSpace < 0xff) {
               // Empty bucket found. End of search
               return Num;
            }
            else {
               // Block is full. Search next block

               // Note: It would be logical to set StartBucket = Bucket
               // here in order to allow all buckets in the next block
               // to be tried, but the official algorithm doesn't seem
               // to do so!?
               // StartBucket = Bucket; 

               break;
            }
         }
         // Bucket contains a string. Is it the same string?
         if (blocks[Block].Strings[StringIndex*2] == StringLength
         && strncmp((int8*)&blocks[Block].Strings[StringIndex*2+1], (int8*)String, StringLength) == 0) {
            // Matching string found
            Num++;
            if (Num == 1) {
               // First occurrence. Save module number
               ModulePage = *(uint16*)&blocks[Block].Strings[StringIndex*2+1+StringLength];
            }
         }
         else {
            // Conflicting string found
            Conflicts++;
         }
         // Next bucket
         Bucket = (Bucket + BucketD) % OMFNumBuckets;
      } while (Bucket != StartBucket);

      // Next block
      Block = (Block + BlockD) % NumBlocks;
   }  while (Block != StartBlock);
   // Finished searching all blocks and buckets
   return Num;
}

int COMFHashTable::InsertString(uint16 & ModulePage) {
   // Insert string in hash table.
   // Parameter:
   // ModulePage = module address / page size
   // Return value:
   // 0 if success, 
   // 1 if identical string allready exists in the table. New string will not be entered.
   //   ModulePage will receive the module page of the existing string in this case.
   // 2 if table is full,
   uint16 Block;                                 // Block number
   uint16 Bucket;                                // Bucket number
   uint32 StringIndex;                           // Index to string space
   uint32 StringOffset;                          // Offset to string from begin of block
   uint32 SpaceRequired;                         // Space required to store string

   SpaceRequired = StringLength + 3;             // Space for string + stringlength + module index
   SpaceRequired = (SpaceRequired + 1) & uint32(-2);// Round up to nearest even

   Block = StartBlock;
   Bucket = StartBucket;

   // Loop through blocks
   do {

      // Loop through buckets
      do {

         // String index of current bucket
         StringIndex = blocks[Block].b.Buckets[Bucket];
         if (StringIndex == 0) {
            // Found empty bucket. Check if block has enough free space
            if (uint32(OMFBlockSize) - blocks[Block].b.FreeSpace * 2 < SpaceRequired) {
               // Not enough space in block.
               // Continue with same bucket in next block.

               // Note: It would be logical to set StartBucket = Bucket
               // here in order to allow all buckets in the next block
               // to be tried, but the official algorithm doesn't seem
               // to do so!?
               // StartBucket = Bucket; 
               break;
            }
            // Enough space found. Enter string in bucket
            StringIndex = blocks[Block].b.FreeSpace;
            blocks[Block].b.Buckets[Bucket] = StringIndex;
            // Address to store string
            StringOffset = StringIndex * 2;
            // Store string length
            blocks[Block].Strings[StringOffset] = (uint8)StringLength;
            // Copy string
            memcpy(blocks[Block].Strings + StringOffset + 1, String, StringLength);
            // Insert module page number
            *(uint16*)(blocks[Block].Strings + StringOffset + 1 + StringLength) = ModulePage;
            // Update free space
            blocks[Block].b.FreeSpace += (uint8)(SpaceRequired / 2);
            // Check if overflow
            if (blocks[Block].b.FreeSpace == 0) blocks[Block].b.FreeSpace = 0xFF;
            // Indicate success
            return 0;
         }
         else {
            // Bucket contains a string. Check if it is the same string
            if (blocks[Block].Strings[StringIndex*2] == StringLength
            && strncmp((int8*)(blocks[Block].Strings+StringIndex*2+1), (int8*)String, StringLength) == 0) {
               // Identical string found. Return module index for existing string entry
               ModulePage = *(uint16*)(blocks[Block].Strings+StringIndex*2+1+StringLength);
               // Indicate failure
               return 1;
            }
         }
         // Bucket was full. Go to next bucket
         Bucket = (Bucket + BucketD) % OMFNumBuckets;
      } while (Bucket != StartBucket);

      // If we got here, we have found no empty bucket in the block or 
      // there was not enough string space in the block.
      // We need to mark the block as full to tell the linker to
      // continue in next block when searching for this string
      // Whether the block has any empty buckets or not
      blocks[Block].b.FreeSpace = 0xFF;

      // Go to next block
      Block = (Block + BlockD) % NumBlocks;
   }  while (Block != StartBlock);

   // Finished searching all blocks and buckets
   // No empty space found. Indicate failure:
   return 2;
}


// Table of prime numbers
// You may add more prime numbers if very big library files are needed
static const uint32 PrimeNumbers[] = {
   1, 2, 3, 5, 7, 11, 13, 17, 19, 23, 29, 31, 37, 41, 43, 47, 53, 59, 61, 67, 71,
   73, 79, 83, 89, 97, 101, 103, 107, 109, 113, 127, 131, 137, 139, 149, 151, 157,
   163, 167, 173, 179, 181, 191, 193, 197, 199, 211, 223, 227, 229, 233, 239, 241,
   251, 257, 263, 269, 271, 277, 281, 283, 293, 307, 311, 313, 317, 331, 337, 347,
   349, 353, 359, 367, 373, 379, 383, 389, 397, 401, 409, 419, 421, 431, 433, 439,
   443, 449, 457, 461, 463, 467, 479, 487, 491, 499, 503, 509, 521, 523, 541, 547,
   557, 563, 569, 571, 577, 587, 593, 599, 601, 607, 613, 617, 619, 631, 641, 643,
   647, 653, 659, 661, 673, 677, 683, 691, 701, 709, 719, 727, 733, 739, 743, 751,
   757, 761, 769, 773, 787, 797, 809, 811, 821, 823, 827, 829, 839, 853, 857, 859,
   863, 877, 881, 883, 887, 907, 911, 919, 929, 937, 941, 947, 953, 967, 971, 977,
   983, 991, 997, 1009, 1013, 1019, 1021, 1031, 1033, 1039, 1049, 1051, 1061, 1063,
   1069, 1087, 1091, 1093, 1097, 1103, 1109, 1117, 1123, 1129, 1151, 1153, 1163,
   1171, 1181, 1187, 1193, 1201, 1213, 1217, 1223, 1229, 1231, 1237, 1249, 1259,
   1277, 1279, 1283, 1289, 1291, 1297, 1301, 1303, 1307, 1319, 1321, 1327, 1361,
   1367, 1373, 1381, 1399, 1409, 1423, 1427, 1429, 1433, 1439, 1447, 1451, 1453,
   1459, 1471, 1481, 1483, 1487, 1489, 1493, 1499, 1511, 1523, 1531, 1543, 1549,
   1553, 1559, 1567, 1571, 1579, 1583, 1597, 1601, 1607, 1609, 1613, 1619, 1621,
   1627, 1637, 1657, 1663, 1667, 1669, 1693, 1697, 1699, 1709, 1721, 1723, 1733,
   1741, 1747, 1753, 1759, 1777, 1783, 1787, 1789, 1801, 1811, 1823, 1831, 1847,
   1861, 1867, 1871, 1873, 1877, 1879, 1889, 1901, 1907, 1913, 1931, 1933, 1949,
   1951, 1973, 1979, 1987, 1993, 1997, 1999, 2003, 2011, 2017, 2027, 2029, 2039,
   2053, 2063, 2069, 2081, 2083, 2087, 2089, 2099, 2111, 2113, 2129, 2131, 2137,
   2141, 2143, 2153, 2161, 2179, 2203, 2207, 2213, 2221, 2237, 2239, 2243, 2251,
   2267, 2269, 2273, 2281, 2287, 2293, 2297, 2309, 2311, 2333, 2339, 2341, 2347,
   2351, 2357, 2371, 2377, 2381, 2383, 2389, 2393, 2399, 2411, 2417, 2423, 2437,
   2441, 2447, 2459, 2467, 2473, 2477, 2503, 2521, 2531, 2539, 2543, 2549, 2551,
   2557, 2579, 2591, 2593, 2609, 2617, 2621, 2633, 2647, 2657, 2659, 2663, 2671,
   2677, 2683, 2687, 2689, 2693, 2699, 2707, 2711, 2713, 2719, 2729, 2731, 2741,
   2749, 2753, 2767, 2777, 2789, 2791, 2797, 2801, 2803, 2819, 2833, 2837, 2843,
   2851, 2857, 2861, 2879, 2887, 2897, 2903, 2909, 2917, 2927, 2939, 2953, 2957,
   2963, 2969, 2971, 2999, 3001, 3011, 3019, 3023, 3037, 3041, 3049, 3061, 3067,
   3079, 3083, 3089, 3109, 3119, 3121, 3137, 3163, 3167, 3169, 3181, 3187, 3191,
   3203, 3209, 3217, 3221, 3229, 3251, 3253, 3257, 3259, 3271, 3299, 3301, 3307,
   3313, 3319, 3323, 3329, 3331, 3343, 3347, 3359, 3361, 3371, 3373, 3389, 3391,
   3407, 3413, 3433, 3449, 3457, 3461, 3463, 3467, 3469, 3491, 3499, 3511, 3517,
   3527, 3529, 3533, 3539, 3541, 3547, 3557, 3559, 3571, 3581, 3583, 3593, 3607,
   3613, 3617, 3623, 3631, 3637, 3643, 3659, 3671, 3673, 3677, 3691, 3697, 3701,
   3709, 3719, 3727, 3733, 3739, 3761, 3767, 3769, 3779, 3793, 3797, 3803, 3821,
   3823, 3833, 3847, 3851, 3853, 3863, 3877, 3881, 3889, 3907, 3911, 3917, 3919,
   3923, 3929, 3931, 3943, 3947, 3967, 3989, 4001, 4003, 4007, 4013, 4019, 4021,
   4027, 4049, 4051, 4057, 4073, 4079, 4091, 4093, 4099, 4111, 4127, 4129, 4133,
   4139, 4153, 4157, 4159, 4177, 4201, 4211, 4217, 4219, 4229, 4231, 4241, 4243,
   4253, 4259, 4261, 4271, 4273, 4283, 4289, 4297, 4327, 4337, 4339, 4349, 4357,
   4363, 4373, 4391, 4397, 4409, 4421, 4423, 4441, 4447, 4451, 4457, 4463, 4481,
   4483, 4493, 4507, 4513, 4517, 4519, 4523, 4547, 4549, 4561, 4567, 4583, 4591,
   4597, 4603, 4621, 4637, 4639, 4643, 4649, 4651, 4657, 4663, 4673, 4679, 4691,
   4703, 4721, 4723, 4729, 4733, 4751, 4759, 4783, 4787, 4789, 4793, 4799, 4801,
   4813, 4817, 4831, 4861, 4871, 4877, 4889, 4903, 4909, 4919, 4931, 4933, 4937,
   4943, 4951, 4957, 4967, 4969, 4973, 4987, 4993, 4999, 5003, 5009, 5011, 5021
};

// Length of table
static const uint32 PrimeNumbersLen = sizeof(PrimeNumbers)/sizeof(PrimeNumbers[0]);


void COMFHashTable::MakeHashTable(CSList<SStringEntry> & StringEntries, 
CMemoryBuffer & StringBuffer, CMemoryBuffer & OutFile, CLibrary * Library) {
   // Make hash table. Parameters:
   // StringEntries[].String = name of each public symbol as offset into StringBuffer
   // StringEntries[].Member = page address of member = offset / page size
   // StringBuffer = contains all strings
   // OutFile will receive the output hash table

   CSList<SOMFHashBlock> HashTable;              // Hash table
   COMFHashTable TableHandler;                   // Hash table handler
   uint32 NumBlocksI;                            // Number of blocks as index into prime number table
   uint32 BlockI;                                // Block index
   uint32 SymI;                                  // Symbol index
   int8 * String;                                // Symbol name
   uint16 Module1, Module2;                      // Module page = offset / page size
   int    Result;                                // 0 = success

   // Estimate required number of blocks
   NumBlocks = (StringEntries.GetNumEntries() * 8 + StringBuffer.GetDataSize()) / 256;
   // Find nearest prime number >= NumBlocks, but stay within the range from 2 to 251.
   // The minimum NumBlocks is 1, but some systems use 2 as the minimum.
   // The maximum is 251, but some linkers may allow a higher number

   for (NumBlocksI = 1; NumBlocksI < 55; NumBlocksI++) {
      if (PrimeNumbers[NumBlocksI] >= NumBlocks) break;
   }

   // Try if this number of blocks is sufficient
   while (NumBlocksI < PrimeNumbersLen) {

      // Get number of blocks from prime numbers table
      NumBlocks = PrimeNumbers[NumBlocksI];

      // Check if <= 251
      if (NumBlocks > 255) err.submit(1215); // Number of blocks exceeds official limit. May still work with some linkers

      // Allocate space for hash table
      HashTable.SetNum(NumBlocks);
      memset(&HashTable[0], 0, NumBlocks * OMFBlockSize);

      // Initialize hash table handler
      TableHandler.Init(&HashTable[0], NumBlocks);

      // Set free space pointers
      for (BlockI = 0; BlockI < NumBlocks; BlockI++) {
         TableHandler.blocks[BlockI].b.FreeSpace = 19;
      }
      Result = 0;

      // Insert symbols
      // Loop through symbols
      for (SymI = 0; SymI < StringEntries.GetNumEntries(); SymI++) {

         // Symbol name
         String = StringBuffer.Buf() + StringEntries[SymI].String;

         // Module page
         Module1 = Module2 = StringEntries[SymI].Member;

         // Insert name in table
         TableHandler.MakeHash(String);
         Result = TableHandler.InsertString(Module2);

         if (Result == 1) {
            // String already exists
            // Compose error string "Modulename1 and Modulename2"
            char ErrorModuleNames[64];
            strcpy(ErrorModuleNames, Library->GetModuleName(Module1));
            strcpy(ErrorModuleNames + strlen(ErrorModuleNames), " and ");
            strcpy(ErrorModuleNames + strlen(ErrorModuleNames), Library->GetModuleName(Module2));
            // submit error message
            err.submit(1214, String, ErrorModuleNames);
         }
         if (Result == 2) {
            // Table is full. Stop and repeat with a higher NumBlocks
            break;
         }
      } // End of loop through symbols

      if (Result < 2) {
         // Finished with success
         // Store hash table
         OutFile.Push(&HashTable[0], HashTable.GetNumEntries() * OMFBlockSize);
         return;
      }

      // Table is full. Try again with a higher number of blocks
      NumBlocksI++;
   }

   // End of loop through PrimeNumbers table
   err.submit(2605);                             // Failed to make table
}
