FileSignatureChecker.cs 9.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240
  1. /* This file is part of SevenZipSharp.
  2. SevenZipSharp is free software: you can redistribute it and/or modify
  3. it under the terms of the GNU Lesser General Public License as published by
  4. the Free Software Foundation, either version 3 of the License, or
  5. (at your option) any later version.
  6. SevenZipSharp is distributed in the hope that it will be useful,
  7. but WITHOUT ANY WARRANTY; without even the implied warranty of
  8. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  9. GNU Lesser General Public License for more details.
  10. You should have received a copy of the GNU Lesser General Public License
  11. along with SevenZipSharp. If not, see <http://www.gnu.org/licenses/>.
  12. */
  13. using System;
  14. using System.IO;
  15. namespace SevenZip
  16. {
  17. #if UNMANAGED
  18. /// <summary>
  19. /// The signature checker class. Original code by Siddharth Uppal, adapted by Markhor.
  20. /// </summary>
  21. /// <remarks>Based on the code at http://blog.somecreativity.com/2008/04/08/how-to-check-if-a-file-is-compressed-in-c/#</remarks>
  22. internal static class FileChecker
  23. {
  24. private const int SIGNATURE_SIZE = 16;
  25. private const int SFX_SCAN_LENGTH = 256 * 1024;
  26. private static bool SpecialDetect(Stream stream, int offset, InArchiveFormat expectedFormat)
  27. {
  28. if (stream.Length > offset + SIGNATURE_SIZE)
  29. {
  30. var signature = new byte[SIGNATURE_SIZE];
  31. int bytesRequired = SIGNATURE_SIZE;
  32. int index = 0;
  33. stream.Seek(offset, SeekOrigin.Begin);
  34. while (bytesRequired > 0)
  35. {
  36. int bytesRead = stream.Read(signature, index, bytesRequired);
  37. bytesRequired -= bytesRead;
  38. index += bytesRead;
  39. }
  40. string actualSignature = BitConverter.ToString(signature);
  41. foreach (string expectedSignature in Formats.InSignatureFormats.Keys)
  42. {
  43. if (Formats.InSignatureFormats[expectedSignature] != expectedFormat)
  44. {
  45. continue;
  46. }
  47. if (actualSignature.StartsWith(expectedSignature, StringComparison.OrdinalIgnoreCase))
  48. {
  49. return true;
  50. }
  51. }
  52. }
  53. return false;
  54. }
  55. /// <summary>
  56. /// Gets the InArchiveFormat for a specific extension.
  57. /// </summary>
  58. /// <param name="stream">The stream to identify.</param>
  59. /// <param name="offset">The archive beginning offset.</param>
  60. /// <param name="isExecutable">True if the original format of the stream is PE; otherwise, false.</param>
  61. /// <returns>Corresponding InArchiveFormat.</returns>
  62. public static InArchiveFormat CheckSignature(Stream stream, out int offset, out bool isExecutable)
  63. {
  64. offset = 0;
  65. if (!stream.CanRead)
  66. {
  67. throw new ArgumentException("The stream must be readable.");
  68. }
  69. if (stream.Length < SIGNATURE_SIZE)
  70. {
  71. throw new ArgumentException("The stream is invalid.");
  72. }
  73. #region Get file signature
  74. var signature = new byte[SIGNATURE_SIZE];
  75. int bytesRequired = SIGNATURE_SIZE;
  76. int index = 0;
  77. stream.Seek(0, SeekOrigin.Begin);
  78. while (bytesRequired > 0)
  79. {
  80. int bytesRead = stream.Read(signature, index, bytesRequired);
  81. bytesRequired -= bytesRead;
  82. index += bytesRead;
  83. }
  84. string actualSignature = BitConverter.ToString(signature);
  85. #endregion
  86. InArchiveFormat suspectedFormat = InArchiveFormat.XZ; // any except PE and Cab
  87. isExecutable = false;
  88. foreach (string expectedSignature in Formats.InSignatureFormats.Keys)
  89. {
  90. if (actualSignature.StartsWith(expectedSignature, StringComparison.OrdinalIgnoreCase) ||
  91. actualSignature.Substring(6).StartsWith(expectedSignature, StringComparison.OrdinalIgnoreCase) &&
  92. Formats.InSignatureFormats[expectedSignature] == InArchiveFormat.Lzh)
  93. {
  94. if (Formats.InSignatureFormats[expectedSignature] == InArchiveFormat.PE)
  95. {
  96. suspectedFormat = InArchiveFormat.PE;
  97. isExecutable = true;
  98. }
  99. else
  100. {
  101. return Formats.InSignatureFormats[expectedSignature];
  102. }
  103. }
  104. }
  105. // Many Microsoft formats
  106. if (actualSignature.StartsWith("D0-CF-11-E0-A1-B1-1A-E1", StringComparison.OrdinalIgnoreCase))
  107. {
  108. suspectedFormat = InArchiveFormat.Cab; // != InArchiveFormat.XZ
  109. }
  110. #region SpecialDetect
  111. try
  112. {
  113. SpecialDetect(stream, 257, InArchiveFormat.Tar);
  114. }
  115. catch (ArgumentException) {}
  116. if (SpecialDetect(stream, 0x8001, InArchiveFormat.Iso))
  117. {
  118. return InArchiveFormat.Iso;
  119. }
  120. if (SpecialDetect(stream, 0x8801, InArchiveFormat.Iso))
  121. {
  122. return InArchiveFormat.Iso;
  123. }
  124. if (SpecialDetect(stream, 0x9001, InArchiveFormat.Iso))
  125. {
  126. return InArchiveFormat.Iso;
  127. }
  128. if (SpecialDetect(stream, 0x9001, InArchiveFormat.Iso))
  129. {
  130. return InArchiveFormat.Iso;
  131. }
  132. if (SpecialDetect(stream, 0x400, InArchiveFormat.Hfs))
  133. {
  134. return InArchiveFormat.Hfs;
  135. }
  136. #region Last resort for tar - can mistake
  137. if (stream.Length >= 1024)
  138. {
  139. stream.Seek(-1024, SeekOrigin.End);
  140. byte[] buf = new byte[1024];
  141. stream.Read(buf, 0, 1024);
  142. bool istar = true;
  143. for (int i = 0; i < 1024; i++)
  144. {
  145. istar = istar && buf[i] == 0;
  146. }
  147. if (istar)
  148. {
  149. return InArchiveFormat.Tar;
  150. }
  151. }
  152. #endregion
  153. #endregion
  154. #region Check if it is an SFX archive or a file with an embedded archive.
  155. if (suspectedFormat != InArchiveFormat.XZ)
  156. {
  157. #region Get first Min(stream.Length, SFX_SCAN_LENGTH) bytes
  158. var scanLength = Math.Min(stream.Length, SFX_SCAN_LENGTH);
  159. signature = new byte[scanLength];
  160. bytesRequired = (int)scanLength;
  161. index = 0;
  162. stream.Seek(0, SeekOrigin.Begin);
  163. while (bytesRequired > 0)
  164. {
  165. int bytesRead = stream.Read(signature, index, bytesRequired);
  166. bytesRequired -= bytesRead;
  167. index += bytesRead;
  168. }
  169. actualSignature = BitConverter.ToString(signature);
  170. #endregion
  171. foreach (var format in new InArchiveFormat[]
  172. {
  173. InArchiveFormat.Zip,
  174. InArchiveFormat.SevenZip,
  175. InArchiveFormat.Rar,
  176. InArchiveFormat.Cab,
  177. InArchiveFormat.Arj
  178. })
  179. {
  180. int pos = actualSignature.IndexOf(Formats.InSignatureFormatsReversed[format]);
  181. if (pos > -1)
  182. {
  183. offset = pos / 3;
  184. return format;
  185. }
  186. }
  187. // Nothing
  188. if (suspectedFormat == InArchiveFormat.PE)
  189. {
  190. return InArchiveFormat.PE;
  191. }
  192. }
  193. #endregion
  194. throw new ArgumentException("The stream is invalid or no corresponding signature was found.");
  195. }
  196. /// <summary>
  197. /// Gets the InArchiveFormat for a specific file name.
  198. /// </summary>
  199. /// <param name="fileName">The archive file name.</param>
  200. /// <param name="offset">The archive beginning offset.</param>
  201. /// <param name="isExecutable">True if the original format of the file is PE; otherwise, false.</param>
  202. /// <returns>Corresponding InArchiveFormat.</returns>
  203. /// <exception cref="System.ArgumentException"/>
  204. public static InArchiveFormat CheckSignature(string fileName, out int offset, out bool isExecutable)
  205. {
  206. using (var fs = new FileStream(fileName, FileMode.Open, FileAccess.Read, FileShare.ReadWrite))
  207. {
  208. try
  209. {
  210. return CheckSignature(fs, out offset, out isExecutable);
  211. }
  212. catch (ArgumentException)
  213. {
  214. offset = 0;
  215. isExecutable = false;
  216. return Formats.FormatByFileName(fileName, true);
  217. }
  218. }
  219. }
  220. }
  221. #endif
  222. }