upstream/mercurial-mirror Commit - r52746:4777378f

1

use std::collections::{HashMap, HashSet};

1

use std::collections::{HashMap, HashSet};

2

use std::fmt::Debug;

2

use std::fmt::Debug;

3

use std::ops::Deref;

3

use std::ops::Deref;

4

use std::sync::{RwLock, RwLockReadGuard, RwLockWriteGuard};

4

use std::sync::{RwLock, RwLockReadGuard, RwLockWriteGuard};

5

6

use bitvec::prelude::*;

6

use bitvec::prelude::*;

7

use byteorder::{BigEndian, ByteOrder};

7

use byteorder::{BigEndian, ByteOrder};

8

use bytes_cast::{unaligned, BytesCast};

8

use bytes_cast::{unaligned, BytesCast};

9

10

use super::REVIDX_KNOWN_FLAGS;

10

use super::REVIDX_KNOWN_FLAGS;

11

use crate::errors::HgError;

11

use crate::errors::HgError;

12

use crate::node::{NODE_BYTES_LENGTH, NULL_NODE, STORED_NODE_ID_BYTES};

12

use crate::node::{NODE_BYTES_LENGTH, NULL_NODE, STORED_NODE_ID_BYTES};

13

use crate::revlog::node::Node;

13

use crate::revlog::node::Node;

14

use crate::revlog::{Revision, NULL_REVISION};

14

use crate::revlog::{Revision, NULL_REVISION};

15

use crate::{

15

use crate::{

16

dagops, BaseRevision, FastHashMap, Graph, GraphError, RevlogError,

16

dagops, BaseRevision, FastHashMap, Graph, GraphError, RevlogError,

17

RevlogIndex, UncheckedRevision,

17

RevlogIndex, UncheckedRevision,

18

};

18

};

19

20

pub const INDEX_ENTRY_SIZE: usize = 64;

20

pub const INDEX_ENTRY_SIZE: usize = 64;

21

pub const INDEX_HEADER_SIZE: usize = 4;

21

pub const INDEX_HEADER_SIZE: usize = 4;

22

pub const COMPRESSION_MODE_INLINE: u8 = 2;

22

pub const COMPRESSION_MODE_INLINE: u8 = 2;

23

24

#[derive(Debug)]

24

#[derive(Debug)]

25

pub struct IndexHeader {

25

pub struct IndexHeader {

26

pub(super) header_bytes: [u8; INDEX_HEADER_SIZE],

26

pub(super) header_bytes: [u8; INDEX_HEADER_SIZE],

27

}

27

}

28

29

#[derive(Copy, Clone)]

29

#[derive(Copy, Clone, Debug)]

30

pub struct IndexHeaderFlags {

30

pub struct IndexHeaderFlags {

31

flags: u16,

31

flags: u16,

32

}

32

}

33

34

/// Corresponds to the high bits of `_format_flags` in python

34

/// Corresponds to the high bits of `_format_flags` in python

35

impl IndexHeaderFlags {

35

impl IndexHeaderFlags {

36

/// Corresponds to FLAG_INLINE_DATA in python

36

/// Corresponds to FLAG_INLINE_DATA in python

37

pub fn is_inline(self) -> bool {

37

pub fn is_inline(self) -> bool {

38

self.flags & 1 != 0

38

self.flags & 1 != 0

39

}

39

}

40

/// Corresponds to FLAG_GENERALDELTA in python

40

/// Corresponds to FLAG_GENERALDELTA in python

41

pub fn uses_generaldelta(self) -> bool {

41

pub fn uses_generaldelta(self) -> bool {

42

self.flags & 2 != 0

42

self.flags & 2 != 0

43

}

43

}

44

}

44

}

45

46

/// Corresponds to the INDEX_HEADER structure,

46

/// Corresponds to the INDEX_HEADER structure,

47

/// which is parsed as a `header` variable in `_loadindex` in `revlog.py`

47

/// which is parsed as a `header` variable in `_loadindex` in `revlog.py`

48

impl IndexHeader {

48

impl IndexHeader {

49

fn format_flags(&self) -> IndexHeaderFlags {

49

fn format_flags(&self) -> IndexHeaderFlags {

50

// No "unknown flags" check here, unlike in python. Maybe there should

50

// No "unknown flags" check here, unlike in python. Maybe there should

51

// be.

51

// be.

52

IndexHeaderFlags {

52

IndexHeaderFlags {

53

flags: BigEndian::read_u16(&self.header_bytes[0..2]),

53

flags: BigEndian::read_u16(&self.header_bytes[0..2]),

54

}

54

}

55

}

55

}

56

57

/// The only revlog version currently supported by rhg.

57

/// The only revlog version currently supported by rhg.

58

const REVLOGV1: u16 = 1;

58

const REVLOGV1: u16 = 1;

59

60

/// Corresponds to `_format_version` in Python.

60

/// Corresponds to `_format_version` in Python.

61

fn format_version(&self) -> u16 {

61

fn format_version(&self) -> u16 {

62

BigEndian::read_u16(&self.header_bytes[2..4])

62

BigEndian::read_u16(&self.header_bytes[2..4])

63

}

63

}

64

65

pub fn parse(index_bytes: &[u8]) -> Result<Option<IndexHeader>, HgError> {

65

pub fn parse(index_bytes: &[u8]) -> Result<Option<IndexHeader>, HgError> {

66

if index_bytes.is_empty() {

66

if index_bytes.is_empty() {

67

return Ok(None);

67

return Ok(None);

68

}

68

}

69

if index_bytes.len() < 4 {

69

if index_bytes.len() < 4 {

70

return Err(HgError::corrupted(

70

return Err(HgError::corrupted(

71

"corrupted revlog: can't read the index format header",

71

"corrupted revlog: can't read the index format header",

72

));

72

));

73

}

73

}

74

Ok(Some(IndexHeader {

74

Ok(Some(IndexHeader {

75

header_bytes: {

75

header_bytes: {

76

let bytes: [u8; 4] =

76

let bytes: [u8; 4] =

77

index_bytes[0..4].try_into().expect("impossible");

77

index_bytes[0..4].try_into().expect("impossible");

78

bytes

78

bytes

79

},

79

},

80

}))

80

}))

81

}

81

}

82

}

82

}

83

84

/// Abstracts the access to the index bytes since they can be spread between

84

/// Abstracts the access to the index bytes since they can be spread between

85

/// the immutable (bytes) part and the mutable (added) part if any appends

85

/// the immutable (bytes) part and the mutable (added) part if any appends

86

/// happened. This makes it transparent for the callers.

86

/// happened. This makes it transparent for the callers.

87

struct IndexData {

87

struct IndexData {

88

/// Immutable bytes, most likely taken from disk

88

/// Immutable bytes, most likely taken from disk

89

bytes: Box<dyn Deref<Target = [u8]> + Send + Sync>,

89

bytes: Box<dyn Deref<Target = [u8]> + Send + Sync>,

90

/// Used when stripping index contents, keeps track of the start of the

90

/// Used when stripping index contents, keeps track of the start of the

91

/// first stripped revision, which is used to give a slice of the

91

/// first stripped revision, which is used to give a slice of the

92

/// `bytes` field.

92

/// `bytes` field.

93

truncation: Option<usize>,

93

truncation: Option<usize>,

94

/// Bytes that were added after reading the index

94

/// Bytes that were added after reading the index

95

added: Vec<u8>,

95

added: Vec<u8>,

96

first_entry: [u8; INDEX_ENTRY_SIZE],

96

first_entry: [u8; INDEX_ENTRY_SIZE],

97

}

97

}

98

99

impl IndexData {

99

impl IndexData {

100

pub fn new(bytes: Box<dyn Deref<Target = [u8]> + Send + Sync>) -> Self {

100

pub fn new(bytes: Box<dyn Deref<Target = [u8]> + Send + Sync>) -> Self {

101

let mut first_entry = [0; INDEX_ENTRY_SIZE];

101

let mut first_entry = [0; INDEX_ENTRY_SIZE];

102

if bytes.len() >= INDEX_ENTRY_SIZE {

102

if bytes.len() >= INDEX_ENTRY_SIZE {

103

first_entry[INDEX_HEADER_SIZE..]

103

first_entry[INDEX_HEADER_SIZE..]

104

.copy_from_slice(&bytes[INDEX_HEADER_SIZE..INDEX_ENTRY_SIZE])

104

.copy_from_slice(&bytes[INDEX_HEADER_SIZE..INDEX_ENTRY_SIZE])

105

}

105

}

106

Self {

106

Self {

107

bytes,

107

bytes,

108

truncation: None,

108

truncation: None,

109

added: vec![],

109

added: vec![],

110

first_entry,

110

first_entry,

111

}

111

}

112

}

112

}

113

114

pub fn len(&self) -> usize {

114

pub fn len(&self) -> usize {

115

match self.truncation {

115

match self.truncation {

116

Some(truncation) => truncation + self.added.len(),

116

Some(truncation) => truncation + self.added.len(),

117

None => self.bytes.len() + self.added.len(),

117

None => self.bytes.len() + self.added.len(),

118

}

118

}

119

}

119

}

120

121

fn remove(

121

fn remove(

122

&mut self,

122

&mut self,

123

rev: Revision,

123

rev: Revision,

124

offsets: Option<&[usize]>,

124

offsets: Option<&[usize]>,

125

) -> Result<(), RevlogError> {

125

) -> Result<(), RevlogError> {

126

let rev = rev.0 as usize;

126

let rev = rev.0 as usize;

127

let truncation = if let Some(offsets) = offsets {

127

let truncation = if let Some(offsets) = offsets {

128

offsets[rev]

128

offsets[rev]

129

} else {

129

} else {

130

rev * INDEX_ENTRY_SIZE

130

rev * INDEX_ENTRY_SIZE

131

};

131

};

132

if truncation < self.bytes.len() {

132

if truncation < self.bytes.len() {

133

self.truncation = Some(truncation);

133

self.truncation = Some(truncation);

134

self.added.clear();

134

self.added.clear();

135

} else {

135

} else {

136

self.added.truncate(truncation - self.bytes.len());

136

self.added.truncate(truncation - self.bytes.len());

137

}

137

}

138

Ok(())

138

Ok(())

139

}

139

}

140

141

fn is_new(&self) -> bool {

141

fn is_new(&self) -> bool {

142

self.bytes.is_empty()

142

self.bytes.is_empty()

143

}

143

}

144

}

144

}

145

146

impl std::ops::Index<std::ops::Range<usize>> for IndexData {

146

impl std::ops::Index<std::ops::Range<usize>> for IndexData {

147

type Output = [u8];

147

type Output = [u8];

148

149

fn index(&self, index: std::ops::Range<usize>) -> &Self::Output {

149

fn index(&self, index: std::ops::Range<usize>) -> &Self::Output {

150

let start = index.start;

150

let start = index.start;

151

let end = index.end;

151

let end = index.end;

152

let immutable_len = match self.truncation {

152

let immutable_len = match self.truncation {

153

Some(truncation) => truncation,

153

Some(truncation) => truncation,

154

None => self.bytes.len(),

154

None => self.bytes.len(),

155

};

155

};

156

if start < immutable_len {

156

if start < immutable_len {

157

if end > immutable_len {

157

if end > immutable_len {

158

panic!("index data cannot span existing and added ranges");

158

panic!("index data cannot span existing and added ranges");

159

}

159

}

160

&self.bytes[index]

160

&self.bytes[index]

161

} else {

161

} else {

162

&self.added[start - immutable_len..end - immutable_len]

162

&self.added[start - immutable_len..end - immutable_len]

163

}

163

}

164

}

164

}

165

}

165

}

166

167

#[derive(Debug, PartialEq, Eq)]

167

#[derive(Debug, PartialEq, Eq)]

168

pub struct RevisionDataParams {

168

pub struct RevisionDataParams {

169

pub flags: u16,

169

pub flags: u16,

170

pub data_offset: u64,

170

pub data_offset: u64,

171

pub data_compressed_length: i32,

171

pub data_compressed_length: i32,

172

pub data_uncompressed_length: i32,

172

pub data_uncompressed_length: i32,

173

pub data_delta_base: i32,

173

pub data_delta_base: i32,

174

pub link_rev: i32,

174

pub link_rev: i32,

175

pub parent_rev_1: i32,

175

pub parent_rev_1: i32,

176

pub parent_rev_2: i32,

176

pub parent_rev_2: i32,

177

pub node_id: [u8; NODE_BYTES_LENGTH],

177

pub node_id: [u8; NODE_BYTES_LENGTH],

178

pub _sidedata_offset: u64,

178

pub _sidedata_offset: u64,

179

pub _sidedata_compressed_length: i32,

179

pub _sidedata_compressed_length: i32,

180

pub data_compression_mode: u8,

180

pub data_compression_mode: u8,

181

pub _sidedata_compression_mode: u8,

181

pub _sidedata_compression_mode: u8,

182

pub _rank: i32,

182

pub _rank: i32,

183

}

183

}

184

185

impl Default for RevisionDataParams {

185

impl Default for RevisionDataParams {

186

fn default() -> Self {

186

fn default() -> Self {

187

Self {

187

Self {

188

flags: 0,

188

flags: 0,

189

data_offset: 0,

189

data_offset: 0,

190

data_compressed_length: 0,

190

data_compressed_length: 0,

191

data_uncompressed_length: 0,

191

data_uncompressed_length: 0,

192

data_delta_base: -1,

192

data_delta_base: -1,

193

link_rev: -1,

193

link_rev: -1,

194

parent_rev_1: -1,

194

parent_rev_1: -1,

195

parent_rev_2: -1,

195

parent_rev_2: -1,

196

node_id: [0; NODE_BYTES_LENGTH],

196

node_id: [0; NODE_BYTES_LENGTH],

197

_sidedata_offset: 0,

197

_sidedata_offset: 0,

198

_sidedata_compressed_length: 0,

198

_sidedata_compressed_length: 0,

199

data_compression_mode: COMPRESSION_MODE_INLINE,

199

data_compression_mode: COMPRESSION_MODE_INLINE,

200

_sidedata_compression_mode: COMPRESSION_MODE_INLINE,

200

_sidedata_compression_mode: COMPRESSION_MODE_INLINE,

201

_rank: -1,

201

_rank: -1,

202

}

202

}

203

}

203

}

204

}

204

}

205

206

#[derive(BytesCast)]

206

#[derive(BytesCast)]

207

#[repr(C)]

207

#[repr(C)]

208

pub struct RevisionDataV1 {

208

pub struct RevisionDataV1 {

209

data_offset_or_flags: unaligned::U64Be,

209

data_offset_or_flags: unaligned::U64Be,

210

data_compressed_length: unaligned::I32Be,

210

data_compressed_length: unaligned::I32Be,

211

data_uncompressed_length: unaligned::I32Be,

211

data_uncompressed_length: unaligned::I32Be,

212

data_delta_base: unaligned::I32Be,

212

data_delta_base: unaligned::I32Be,

213

link_rev: unaligned::I32Be,

213

link_rev: unaligned::I32Be,

214

parent_rev_1: unaligned::I32Be,

214

parent_rev_1: unaligned::I32Be,

215

parent_rev_2: unaligned::I32Be,

215

parent_rev_2: unaligned::I32Be,

216

node_id: [u8; STORED_NODE_ID_BYTES],

216

node_id: [u8; STORED_NODE_ID_BYTES],

217

}

217

}

218

219

fn _static_assert_size_of_revision_data_v1() {

219

fn _static_assert_size_of_revision_data_v1() {

220

let _ = std::mem::transmute::<RevisionDataV1, [u8; 64]>;

220

let _ = std::mem::transmute::<RevisionDataV1, [u8; 64]>;

221

}

221

}

222

223

impl RevisionDataParams {

223

impl RevisionDataParams {

224

pub fn validate(&self) -> Result<(), RevlogError> {

224

pub fn validate(&self) -> Result<(), RevlogError> {

225

if self.flags & !REVIDX_KNOWN_FLAGS != 0 {

225

if self.flags & !REVIDX_KNOWN_FLAGS != 0 {

226

return Err(RevlogError::corrupted(format!(

226

return Err(RevlogError::corrupted(format!(

227

"unknown revlog index flags: {}",

227

"unknown revlog index flags: {}",

228

self.flags

228

self.flags

229

)));

229

)));

230

}

230

}

231

if self.data_compression_mode != COMPRESSION_MODE_INLINE {

231

if self.data_compression_mode != COMPRESSION_MODE_INLINE {

232

return Err(RevlogError::corrupted(format!(

232

return Err(RevlogError::corrupted(format!(

233

"invalid data compression mode: {}",

233

"invalid data compression mode: {}",

234

self.data_compression_mode

234

self.data_compression_mode

235

)));

235

)));

236

}

236

}

237

// FIXME isn't this only for v2 or changelog v2?

237

// FIXME isn't this only for v2 or changelog v2?

238

if self._sidedata_compression_mode != COMPRESSION_MODE_INLINE {

238

if self._sidedata_compression_mode != COMPRESSION_MODE_INLINE {

239

return Err(RevlogError::corrupted(format!(

239

return Err(RevlogError::corrupted(format!(

240

"invalid sidedata compression mode: {}",

240

"invalid sidedata compression mode: {}",

241

self._sidedata_compression_mode

241

self._sidedata_compression_mode

242

)));

242

)));

243

}

243

}

244

Ok(())

244

Ok(())

245

}

245

}

246

247

pub fn into_v1(self) -> RevisionDataV1 {

247

pub fn into_v1(self) -> RevisionDataV1 {

248

let data_offset_or_flags = self.data_offset << 16 | self.flags as u64;

248

let data_offset_or_flags = self.data_offset << 16 | self.flags as u64;

249

let mut node_id = [0; STORED_NODE_ID_BYTES];

249

let mut node_id = [0; STORED_NODE_ID_BYTES];

250

node_id[..NODE_BYTES_LENGTH].copy_from_slice(&self.node_id);

250

node_id[..NODE_BYTES_LENGTH].copy_from_slice(&self.node_id);

251

RevisionDataV1 {

251

RevisionDataV1 {

252

data_offset_or_flags: data_offset_or_flags.into(),

252

data_offset_or_flags: data_offset_or_flags.into(),

253

data_compressed_length: self.data_compressed_length.into(),

253

data_compressed_length: self.data_compressed_length.into(),

254

data_uncompressed_length: self.data_uncompressed_length.into(),

254

data_uncompressed_length: self.data_uncompressed_length.into(),

255

data_delta_base: self.data_delta_base.into(),

255

data_delta_base: self.data_delta_base.into(),

256

link_rev: self.link_rev.into(),

256

link_rev: self.link_rev.into(),

257

parent_rev_1: self.parent_rev_1.into(),

257

parent_rev_1: self.parent_rev_1.into(),

258

parent_rev_2: self.parent_rev_2.into(),

258

parent_rev_2: self.parent_rev_2.into(),

259

node_id,

259

node_id,

260

}

260

}

261

}

261

}

262

}

262

}

263

264

/// A Revlog index

264

/// A Revlog index

265

pub struct Index {

265

pub struct Index {

266

bytes: IndexData,

266

bytes: IndexData,

267

/// Offsets of starts of index blocks.

267

/// Offsets of starts of index blocks.

268

/// Only needed when the index is interleaved with data.

268

/// Only needed when the index is interleaved with data.

269

offsets: RwLock<Option<Vec<usize>>>,

269

offsets: RwLock<Option<Vec<usize>>>,

270

uses_generaldelta: bool,

270

uses_generaldelta: bool,

271

is_inline: bool,

271

is_inline: bool,

272

/// Cache of (head_revisions, filtered_revisions)

272

/// Cache of (head_revisions, filtered_revisions)

273

///

273

///

274

/// The head revisions in this index, kept in sync. Should

274

/// The head revisions in this index, kept in sync. Should

275

/// be accessed via the [`Self::head_revs`] method.

275

/// be accessed via the [`Self::head_revs`] method.

276

/// The last filtered revisions in this index, used to make sure

276

/// The last filtered revisions in this index, used to make sure

277

/// we haven't changed filters when returning the cached `head_revs`.

277

/// we haven't changed filters when returning the cached `head_revs`.

278

head_revs: RwLock<(Vec<Revision>, HashSet<Revision>)>,

278

head_revs: RwLock<(Vec<Revision>, HashSet<Revision>)>,

279

}

279

}

280

281

impl Debug for Index {

281

impl Debug for Index {

282

fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {

282

fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {

283

f.debug_struct("Index")

283

f.debug_struct("Index")

284

.field("offsets", &self.offsets)

284

.field("offsets", &self.offsets)

285

.field("uses_generaldelta", &self.uses_generaldelta)

285

.field("uses_generaldelta", &self.uses_generaldelta)

286

.finish()

286

.finish()

287

}

287

}

288

}

288

}

289

290

impl Graph for Index {

290

impl Graph for Index {

291

#[inline(always)]

291

#[inline(always)]

292

fn parents(&self, rev: Revision) -> Result<[Revision; 2], GraphError> {

292

fn parents(&self, rev: Revision) -> Result<[Revision; 2], GraphError> {

293

let err = || GraphError::ParentOutOfRange(rev);

293

let err = || GraphError::ParentOutOfRange(rev);

294

match self.get_entry(rev) {

294

match self.get_entry(rev) {

295

Some(entry) => {

295

Some(entry) => {

296

// The C implementation checks that the parents are valid

296

// The C implementation checks that the parents are valid

297

// before returning

297

// before returning

298

Ok([

298

Ok([

299

self.check_revision(entry.p1()).ok_or_else(err)?,

299

self.check_revision(entry.p1()).ok_or_else(err)?,

300

self.check_revision(entry.p2()).ok_or_else(err)?,

300

self.check_revision(entry.p2()).ok_or_else(err)?,

301

])

301

])

302

}

302

}

303

None => Ok([NULL_REVISION, NULL_REVISION]),

303

None => Ok([NULL_REVISION, NULL_REVISION]),

304

}

304

}

305

}

305

}

306

}

306

}

307

308

/// A cache suitable for find_snapshots

308

/// A cache suitable for find_snapshots

309

///

309

///

310

/// Logically equivalent to a mapping whose keys are [`BaseRevision`] and

310

/// Logically equivalent to a mapping whose keys are [`BaseRevision`] and

311

/// values sets of [`BaseRevision`]

311

/// values sets of [`BaseRevision`]

312

///

312

///

313

/// TODO the dubious part is insisting that errors must be RevlogError

313

/// TODO the dubious part is insisting that errors must be RevlogError

314

/// we would probably need to sprinkle some magic here, such as an associated

314

/// we would probably need to sprinkle some magic here, such as an associated

315

/// type that would be Into<RevlogError> but even that would not be

315

/// type that would be Into<RevlogError> but even that would not be

316

/// satisfactory, as errors potentially have nothing to do with the revlog.

316

/// satisfactory, as errors potentially have nothing to do with the revlog.

317

pub trait SnapshotsCache {

317

pub trait SnapshotsCache {

318

fn insert_for(

318

fn insert_for(

319

&mut self,

319

&mut self,

320

rev: BaseRevision,

320

rev: BaseRevision,

321

value: BaseRevision,

321

value: BaseRevision,

322

) -> Result<(), RevlogError>;

322

) -> Result<(), RevlogError>;

323

}

323

}

324

325

impl SnapshotsCache for FastHashMap<BaseRevision, HashSet<BaseRevision>> {

325

impl SnapshotsCache for FastHashMap<BaseRevision, HashSet<BaseRevision>> {

326

fn insert_for(

326

fn insert_for(

327

&mut self,

327

&mut self,

328

rev: BaseRevision,

328

rev: BaseRevision,

329

value: BaseRevision,

329

value: BaseRevision,

330

) -> Result<(), RevlogError> {

330

) -> Result<(), RevlogError> {

331

let all_values = self.entry(rev).or_default();

331

let all_values = self.entry(rev).or_default();

332

all_values.insert(value);

332

all_values.insert(value);

333

Ok(())

333

Ok(())

334

}

334

}

335

}

335

}

336

337

impl Index {

337

impl Index {

338

/// Create an index from bytes.

338

/// Create an index from bytes.

339

/// Calculate the start of each entry when is_inline is true.

339

/// Calculate the start of each entry when is_inline is true.

340

pub fn new(

340

pub fn new(

341

bytes: Box<dyn Deref<Target = [u8]> + Send + Sync>,

341

bytes: Box<dyn Deref<Target = [u8]> + Send + Sync>,

342

default_header: IndexHeader,

342

default_header: IndexHeader,

343

) -> Result<Self, HgError> {

343

) -> Result<Self, HgError> {

344

let header =

344

let header =

345

IndexHeader::parse(bytes.as_ref())?.unwrap_or(default_header);

345

IndexHeader::parse(bytes.as_ref())?.unwrap_or(default_header);

346

347

if header.format_version() != IndexHeader::REVLOGV1 {

347

if header.format_version() != IndexHeader::REVLOGV1 {

348

// A proper new version should have had a repo/store

348

// A proper new version should have had a repo/store

349

// requirement.

349

// requirement.

350

return Err(HgError::corrupted("unsupported revlog version"));

350

return Err(HgError::corrupted("unsupported revlog version"));

351

}

351

}

352

353

let uses_generaldelta = header.format_flags().uses_generaldelta();

353

let uses_generaldelta = header.format_flags().uses_generaldelta();

354

355

if header.format_flags().is_inline() {

355

if header.format_flags().is_inline() {

356

let mut offset: usize = 0;

356

let mut offset: usize = 0;

357

let mut offsets = Vec::new();

357

let mut offsets = Vec::new();

358

359

while offset + INDEX_ENTRY_SIZE <= bytes.len() {

359

while offset + INDEX_ENTRY_SIZE <= bytes.len() {

360

offsets.push(offset);

360

offsets.push(offset);

361

let end = offset + INDEX_ENTRY_SIZE;

361

let end = offset + INDEX_ENTRY_SIZE;

362

let entry = IndexEntry {

362

let entry = IndexEntry {

363

bytes: &bytes[offset..end],

363

bytes: &bytes[offset..end],

364

};

364

};

365

366

offset += INDEX_ENTRY_SIZE + entry.compressed_len() as usize;

366

offset += INDEX_ENTRY_SIZE + entry.compressed_len() as usize;

367

}

367

}

368

369

if offset == bytes.len() {

369

if offset == bytes.len() {

370

Ok(Self {

370

Ok(Self {

371

bytes: IndexData::new(bytes),

371

bytes: IndexData::new(bytes),

372

offsets: RwLock::new(Some(offsets)),

372

offsets: RwLock::new(Some(offsets)),

373

uses_generaldelta,

373

uses_generaldelta,

374

is_inline: true,

374

is_inline: true,

375

head_revs: RwLock::new((vec![], HashSet::new())),

375

head_revs: RwLock::new((vec![], HashSet::new())),

376

})

376

})

377

} else {

377

} else {

378

Err(HgError::corrupted("unexpected inline revlog length"))

378

Err(HgError::corrupted("unexpected inline revlog length"))

379

}

379

}

380

} else {

380

} else {

381

Ok(Self {

381

Ok(Self {

382

bytes: IndexData::new(bytes),

382

bytes: IndexData::new(bytes),

383

offsets: RwLock::new(None),

383

offsets: RwLock::new(None),

384

uses_generaldelta,

384

uses_generaldelta,

385

is_inline: false,

385

is_inline: false,

386

head_revs: RwLock::new((vec![], HashSet::new())),

386

head_revs: RwLock::new((vec![], HashSet::new())),

387

})

387

})

388

}

388

}

389

}

389

}

390

391

pub fn uses_generaldelta(&self) -> bool {

391

pub fn uses_generaldelta(&self) -> bool {

392

self.uses_generaldelta

392

self.uses_generaldelta

393

}

393

}

394

395

/// Value of the inline flag.

395

/// Value of the inline flag.

396

pub fn is_inline(&self) -> bool {

396

pub fn is_inline(&self) -> bool {

397

self.is_inline

397

self.is_inline

398

}

398

}

399

400

/// Return a slice of bytes if `revlog` is inline. Panic if not.

400

/// Return a slice of bytes if `revlog` is inline. Panic if not.

401

pub fn data(&self, start: usize, end: usize) -> &[u8] {

401

pub fn data(&self, start: usize, end: usize) -> &[u8] {

402

if !self.is_inline() {

402

if !self.is_inline() {

403

panic!("tried to access data in the index of a revlog that is not inline");

403

panic!("tried to access data in the index of a revlog that is not inline");

404

}

404

}

405

&self.bytes[start..end]

405

&self.bytes[start..end]

406

}

406

}

407

408

/// Return number of entries of the revlog index.

408

/// Return number of entries of the revlog index.

409

pub fn len(&self) -> usize {

409

pub fn len(&self) -> usize {

410

if self.is_inline() {

410

if self.is_inline() {

411

(*self.get_offsets())

411

(*self.get_offsets())

412

.as_ref()

412

.as_ref()

413

.expect("inline should have offsets")

413

.expect("inline should have offsets")

414

.len()

414

.len()

415

} else {

415

} else {

416

self.bytes.len() / INDEX_ENTRY_SIZE

416

self.bytes.len() / INDEX_ENTRY_SIZE

417

}

417

}

418

}

418

}

419

420

pub fn get_offsets(&self) -> RwLockReadGuard<Option<Vec<usize>>> {

420

pub fn get_offsets(&self) -> RwLockReadGuard<Option<Vec<usize>>> {

421

assert!(self.is_inline());

421

assert!(self.is_inline());

422

{

422

{

423

// Wrap in a block to drop the read guard

423

// Wrap in a block to drop the read guard

424

let mut offsets = self.offsets.write().unwrap();

424

let mut offsets = self.offsets.write().unwrap();

425

if offsets.is_none() {

425

if offsets.is_none() {

426

offsets.replace(inline_scan(&self.bytes.bytes).1);

426

offsets.replace(inline_scan(&self.bytes.bytes).1);

427

}

427

}

428

}

428

}

429

self.offsets.read().unwrap()

429

self.offsets.read().unwrap()

430

}

430

}

431

432

pub fn get_offsets_mut(&mut self) -> RwLockWriteGuard<Option<Vec<usize>>> {

432

pub fn get_offsets_mut(&mut self) -> RwLockWriteGuard<Option<Vec<usize>>> {

433

assert!(self.is_inline());

433

assert!(self.is_inline());

434

let mut offsets = self.offsets.write().unwrap();

434

let mut offsets = self.offsets.write().unwrap();

435

if offsets.is_none() {

435

if offsets.is_none() {

436

offsets.replace(inline_scan(&self.bytes.bytes).1);

436

offsets.replace(inline_scan(&self.bytes.bytes).1);

437

}

437

}

438

offsets

438

offsets

439

}

439

}

440

441

/// Returns `true` if the `Index` has zero `entries`.

441

/// Returns `true` if the `Index` has zero `entries`.

442

pub fn is_empty(&self) -> bool {

442

pub fn is_empty(&self) -> bool {

443

self.len() == 0

443

self.len() == 0

444

}

444

}

445

446

/// Return the index entry corresponding to the given revision or `None`

446

/// Return the index entry corresponding to the given revision or `None`

447

/// for [`NULL_REVISION`]

447

/// for [`NULL_REVISION`]

448

///

448

///

449

/// The specified revision being of the checked type, it always exists

449

/// The specified revision being of the checked type, it always exists

450

/// if it was validated by this index.

450

/// if it was validated by this index.

451

pub fn get_entry(&self, rev: Revision) -> Option<IndexEntry> {

451

pub fn get_entry(&self, rev: Revision) -> Option<IndexEntry> {

452

if rev == NULL_REVISION {

452

if rev == NULL_REVISION {

453

return None;

453

return None;

454

}

454

}

455

if rev.0 == 0 {

455

if rev.0 == 0 {

456

Some(IndexEntry {

456

Some(IndexEntry {

457

bytes: &self.bytes.first_entry[..],

457

bytes: &self.bytes.first_entry[..],

458

})

458

})

459

} else {

459

} else {

460

Some(if self.is_inline() {

460

Some(if self.is_inline() {

461

self.get_entry_inline(rev)

461

self.get_entry_inline(rev)

462

} else {

462

} else {

463

self.get_entry_separated(rev)

463

self.get_entry_separated(rev)

464

})

464

})

465

}

465

}

466

}

466

}

467

468

/// Return the binary content of the index entry for the given revision

468

/// Return the binary content of the index entry for the given revision

469

///

469

///

470

/// See [get_entry()](`Self::get_entry()`) for cases when `None` is

470

/// See [get_entry()](`Self::get_entry()`) for cases when `None` is

471

/// returned.

471

/// returned.

472

pub fn entry_binary(&self, rev: Revision) -> Option<&[u8]> {

472

pub fn entry_binary(&self, rev: Revision) -> Option<&[u8]> {

473

self.get_entry(rev).map(|e| {

473

self.get_entry(rev).map(|e| {

474

let bytes = e.as_bytes();

474

let bytes = e.as_bytes();

475

if rev.0 == 0 {

475

if rev.0 == 0 {

476

&bytes[4..]

476

&bytes[4..]

477

} else {

477

} else {

478

bytes

478

bytes

479

}

479

}

480

})

480

})

481

}

481

}

482

483

pub fn entry_as_params(

483

pub fn entry_as_params(

484

&self,

484

&self,

485

rev: UncheckedRevision,

485

rev: UncheckedRevision,

486

) -> Option<RevisionDataParams> {

486

) -> Option<RevisionDataParams> {

487

let rev = self.check_revision(rev)?;

487

let rev = self.check_revision(rev)?;

488

self.get_entry(rev).map(|e| RevisionDataParams {

488

self.get_entry(rev).map(|e| RevisionDataParams {

489

flags: e.flags(),

489

flags: e.flags(),

490

data_offset: if rev.0 == 0 && !self.bytes.is_new() {

490

data_offset: if rev.0 == 0 && !self.bytes.is_new() {

491

e.flags() as u64

491

e.flags() as u64

492

} else {

492

} else {

493

e.raw_offset()

493

e.raw_offset()

494

},

494

},

495

data_compressed_length: e

495

data_compressed_length: e

496

.compressed_len()

496

.compressed_len()

497

.try_into()

497

.try_into()

498

.unwrap_or_else(|_| {

498

.unwrap_or_else(|_| {

499

// Python's `unionrepo` sets the compressed length to be

499

// Python's `unionrepo` sets the compressed length to be

500

// `-1` (or `u32::MAX` if transmuted to `u32`) because it

500

// `-1` (or `u32::MAX` if transmuted to `u32`) because it

501

// cannot know the correct compressed length of a given

501

// cannot know the correct compressed length of a given

502

// revision. I'm not sure if this is true, but having this

502

// revision. I'm not sure if this is true, but having this

503

// edge case won't hurt other use cases, let's handle it.

503

// edge case won't hurt other use cases, let's handle it.

504

assert_eq!(e.compressed_len(), u32::MAX);

504

assert_eq!(e.compressed_len(), u32::MAX);

505

NULL_REVISION.0

505

NULL_REVISION.0

506

}),

506

}),

507

data_uncompressed_length: e.uncompressed_len(),

507

data_uncompressed_length: e.uncompressed_len(),

508

data_delta_base: e.base_revision_or_base_of_delta_chain().0,

508

data_delta_base: e.base_revision_or_base_of_delta_chain().0,

509

link_rev: e.link_revision().0,

509

link_rev: e.link_revision().0,

510

parent_rev_1: e.p1().0,

510

parent_rev_1: e.p1().0,

511

parent_rev_2: e.p2().0,

511

parent_rev_2: e.p2().0,

512

node_id: e.hash().as_bytes().try_into().unwrap(),

512

node_id: e.hash().as_bytes().try_into().unwrap(),

513

..Default::default()

513

..Default::default()

514

})

514

})

515

}

515

}

516

517

fn get_entry_inline(&self, rev: Revision) -> IndexEntry {

517

fn get_entry_inline(&self, rev: Revision) -> IndexEntry {

518

let offsets = &self.get_offsets();

518

let offsets = &self.get_offsets();

519

let offsets = offsets.as_ref().expect("inline should have offsets");

519

let offsets = offsets.as_ref().expect("inline should have offsets");

520

let start = offsets[rev.0 as usize];

520

let start = offsets[rev.0 as usize];

521

let end = start + INDEX_ENTRY_SIZE;

521

let end = start + INDEX_ENTRY_SIZE;

522

let bytes = &self.bytes[start..end];

522

let bytes = &self.bytes[start..end];

523

524

IndexEntry { bytes }

524

IndexEntry { bytes }

525

}

525

}

526

527

fn get_entry_separated(&self, rev: Revision) -> IndexEntry {

527

fn get_entry_separated(&self, rev: Revision) -> IndexEntry {

528

let start = rev.0 as usize * INDEX_ENTRY_SIZE;

528

let start = rev.0 as usize * INDEX_ENTRY_SIZE;

529

let end = start + INDEX_ENTRY_SIZE;

529

let end = start + INDEX_ENTRY_SIZE;

530

let bytes = &self.bytes[start..end];

530

let bytes = &self.bytes[start..end];

531

532

IndexEntry { bytes }

532

IndexEntry { bytes }

533

}

533

}

534

535

fn null_entry(&self) -> IndexEntry {

535

fn null_entry(&self) -> IndexEntry {

536

IndexEntry {

536

IndexEntry {

537

bytes: &[0; INDEX_ENTRY_SIZE],

537

bytes: &[0; INDEX_ENTRY_SIZE],

538

}

538

}

539

}

539

}

540

541

/// Return the head revisions of this index

541

/// Return the head revisions of this index

542

pub fn head_revs(&self) -> Result<Vec<Revision>, GraphError> {

542

pub fn head_revs(&self) -> Result<Vec<Revision>, GraphError> {

543

self.head_revs_filtered(&HashSet::new(), false)

543

self.head_revs_filtered(&HashSet::new(), false)

544

.map(|h| h.unwrap())

544

.map(|h| h.unwrap())

545

}

545

}

546

547

/// Python-specific shortcut to save on PyList creation

547

/// Python-specific shortcut to save on PyList creation

548

pub fn head_revs_shortcut(

548

pub fn head_revs_shortcut(

549

&self,

549

&self,

550

) -> Result<Option<Vec<Revision>>, GraphError> {

550

) -> Result<Option<Vec<Revision>>, GraphError> {

551

self.head_revs_filtered(&HashSet::new(), true)

551

self.head_revs_filtered(&HashSet::new(), true)

552

}

552

}

553

554

/// Return the heads removed and added by advancing from `begin` to `end`.

554

/// Return the heads removed and added by advancing from `begin` to `end`.

555

/// In revset language, we compute:

555

/// In revset language, we compute:

556

/// - `heads(:begin)-heads(:end)`

556

/// - `heads(:begin)-heads(:end)`

557

/// - `heads(:end)-heads(:begin)`

557

/// - `heads(:end)-heads(:begin)`

558

pub fn head_revs_diff(

558

pub fn head_revs_diff(

559

&self,

559

&self,

560

begin: Revision,

560

begin: Revision,

561

end: Revision,

561

end: Revision,

562

) -> Result<(Vec<Revision>, Vec<Revision>), GraphError> {

562

) -> Result<(Vec<Revision>, Vec<Revision>), GraphError> {

563

let mut heads_added = vec![];

563

let mut heads_added = vec![];

564

let mut heads_removed = vec![];

564

let mut heads_removed = vec![];

565

566

let mut acc = HashSet::new();

566

let mut acc = HashSet::new();

567

let Revision(begin) = begin;

567

let Revision(begin) = begin;

568

let Revision(end) = end;

568

let Revision(end) = end;

569

let mut i = end;

569

let mut i = end;

570

571

while i > begin {

571

while i > begin {

572

// acc invariant:

572

// acc invariant:

573

// `j` is in the set iff `j <= i` and it has children

573

// `j` is in the set iff `j <= i` and it has children

574

// among `i+1..end` (inclusive)

574

// among `i+1..end` (inclusive)

575

if !acc.remove(&i) {

575

if !acc.remove(&i) {

576

heads_added.push(Revision(i));

576

heads_added.push(Revision(i));

577

}

577

}

578

for Revision(parent) in self.parents(Revision(i))? {

578

for Revision(parent) in self.parents(Revision(i))? {

579

acc.insert(parent);

579

acc.insert(parent);

580

}

580

}

581

i -= 1;

581

i -= 1;

582

}

582

}

583

584

// At this point `acc` contains old revisions that gained new children.

584

// At this point `acc` contains old revisions that gained new children.

585

// We need to check if they had any children before. If not, those

585

// We need to check if they had any children before. If not, those

586

// revisions are the removed heads.

586

// revisions are the removed heads.

587

while !acc.is_empty() {

587

while !acc.is_empty() {

588

// acc invariant:

588

// acc invariant:

589

// `j` is in the set iff `j <= i` and it has children

589

// `j` is in the set iff `j <= i` and it has children

590

// among `begin+1..end`, but not among `i+1..begin` (inclusive)

590

// among `begin+1..end`, but not among `i+1..begin` (inclusive)

591

592

assert!(i >= -1); // yes, `-1` can also be a head if the repo is empty

592

assert!(i >= -1); // yes, `-1` can also be a head if the repo is empty

593

if acc.remove(&i) {

593

if acc.remove(&i) {

594

heads_removed.push(Revision(i));

594

heads_removed.push(Revision(i));

595

}

595

}

596

for Revision(parent) in self.parents(Revision(i))? {

596

for Revision(parent) in self.parents(Revision(i))? {

597

acc.remove(&parent);

597

acc.remove(&parent);

598

}

598

}

599

i -= 1;

599

i -= 1;

600

}

600

}

601

602

Ok((heads_removed, heads_added))

602

Ok((heads_removed, heads_added))

603

}

603

}

604

605

/// Return the head revisions of this index

605

/// Return the head revisions of this index

606

pub fn head_revs_filtered(

606

pub fn head_revs_filtered(

607

&self,

607

&self,

608

filtered_revs: &HashSet<Revision>,

608

filtered_revs: &HashSet<Revision>,

609

py_shortcut: bool,

609

py_shortcut: bool,

610

) -> Result<Option<Vec<Revision>>, GraphError> {

610

) -> Result<Option<Vec<Revision>>, GraphError> {

611

{

611

{

612

let guard = self

612

let guard = self

613

.head_revs

613

.head_revs

614

.read()

614

.read()

615

.expect("RwLock on Index.head_revs should not be poisoned");

615

.expect("RwLock on Index.head_revs should not be poisoned");

616

let self_head_revs = &guard.0;

616

let self_head_revs = &guard.0;

617

let self_filtered_revs = &guard.1;

617

let self_filtered_revs = &guard.1;

618

if !self_head_revs.is_empty()

618

if !self_head_revs.is_empty()

619

&& filtered_revs == self_filtered_revs

619

&& filtered_revs == self_filtered_revs

620

{

620

{

621

if py_shortcut {

621

if py_shortcut {

622

// Don't copy the revs since we've already cached them

622

// Don't copy the revs since we've already cached them

623

// on the Python side.

623

// on the Python side.

624

return Ok(None);

624

return Ok(None);

625

} else {

625

} else {

626

return Ok(Some(self_head_revs.to_owned()));

626

return Ok(Some(self_head_revs.to_owned()));

627

}

627

}

628

}

628

}

629

}

629

}

630

631

let as_vec = if self.is_empty() {

631

let as_vec = if self.is_empty() {

632

vec![NULL_REVISION]

632

vec![NULL_REVISION]

633

} else {

633

} else {

634

let mut not_heads = bitvec![0; self.len()];

634

let mut not_heads = bitvec![0; self.len()];

635

dagops::retain_heads_fast(

635

dagops::retain_heads_fast(

636

self,

636

self,

637

not_heads.as_mut_bitslice(),

637

not_heads.as_mut_bitslice(),

638

filtered_revs,

638

filtered_revs,

639

)?;

639

)?;

640

not_heads

640

not_heads

641

.into_iter()

641

.into_iter()

642

.enumerate()

642

.enumerate()

643

.filter_map(|(idx, is_not_head)| {

643

.filter_map(|(idx, is_not_head)| {

644

if is_not_head {

644

if is_not_head {

645

None

645

None

646

} else {

646

} else {

647

Some(Revision(idx as BaseRevision))

647

Some(Revision(idx as BaseRevision))

648

}

648

}

649

})

649

})

650

.collect()

650

.collect()

651

};

651

};

652

*self

652

*self

653

.head_revs

653

.head_revs

654

.write()

654

.write()

655

.expect("RwLock on Index.head_revs should not be poisoned") =

655

.expect("RwLock on Index.head_revs should not be poisoned") =

656

(as_vec.to_owned(), filtered_revs.to_owned());

656

(as_vec.to_owned(), filtered_revs.to_owned());

657

Ok(Some(as_vec))

657

Ok(Some(as_vec))

658

}

658

}

659

660

/// Obtain the delta chain for a revision.

660

/// Obtain the delta chain for a revision.

661

///

661

///

662

/// `stop_rev` specifies a revision to stop at. If not specified, we

662

/// `stop_rev` specifies a revision to stop at. If not specified, we

663

/// stop at the base of the chain.

663

/// stop at the base of the chain.

664

///

664

///

665

/// Returns a 2-tuple of (chain, stopped) where `chain` is a vec of

665

/// Returns a 2-tuple of (chain, stopped) where `chain` is a vec of

666

/// revs in ascending order and `stopped` is a bool indicating whether

666

/// revs in ascending order and `stopped` is a bool indicating whether

667

/// `stoprev` was hit.

667

/// `stoprev` was hit.

668

pub fn delta_chain(

668

pub fn delta_chain(

669

&self,

669

&self,

670

rev: Revision,

670

rev: Revision,

671

stop_rev: Option<Revision>,

671

stop_rev: Option<Revision>,

672

using_general_delta: Option<bool>,

672

using_general_delta: Option<bool>,

673

) -> Result<(Vec<Revision>, bool), HgError> {

673

) -> Result<(Vec<Revision>, bool), HgError> {

674

let mut current_rev = rev;

674

let mut current_rev = rev;

675

let mut entry = self.get_entry(rev).unwrap();

675

let mut entry = self.get_entry(rev).unwrap();

676

let mut chain = vec![];

676

let mut chain = vec![];

677

let using_general_delta =

677

let using_general_delta =

678

using_general_delta.unwrap_or_else(|| self.uses_generaldelta());

678

using_general_delta.unwrap_or_else(|| self.uses_generaldelta());

679

while current_rev.0 != entry.base_revision_or_base_of_delta_chain().0

679

while current_rev.0 != entry.base_revision_or_base_of_delta_chain().0

680

&& stop_rev.map(|r| r != current_rev).unwrap_or(true)

680

&& stop_rev.map(|r| r != current_rev).unwrap_or(true)

681

{

681

{

682

chain.push(current_rev);

682

chain.push(current_rev);

683

let new_rev = if using_general_delta {

683

let new_rev = if using_general_delta {

684

entry.base_revision_or_base_of_delta_chain()

684

entry.base_revision_or_base_of_delta_chain()

685

} else {

685

} else {

686

UncheckedRevision(current_rev.0 - 1)

686

UncheckedRevision(current_rev.0 - 1)

687

};

687

};

688

current_rev = self.check_revision(new_rev).ok_or_else(|| {

688

current_rev = self.check_revision(new_rev).ok_or_else(|| {

689

HgError::corrupted(format!("Revision {new_rev} out of range"))

689

HgError::corrupted(format!("Revision {new_rev} out of range"))

690

})?;

690

})?;

691

if current_rev.0 == NULL_REVISION.0 {

691

if current_rev.0 == NULL_REVISION.0 {

692

break;

692

break;

693

}

693

}

694

entry = self.get_entry(current_rev).unwrap()

694

entry = self.get_entry(current_rev).unwrap()

695

}

695

}

696

697

let stopped = if stop_rev.map(|r| current_rev == r).unwrap_or(false) {

697

let stopped = if stop_rev.map(|r| current_rev == r).unwrap_or(false) {

698

true

698

true

699

} else {

699

} else {

700

chain.push(current_rev);

700

chain.push(current_rev);

701

false

701

false

702

};

702

};

703

chain.reverse();

703

chain.reverse();

704

Ok((chain, stopped))

704

Ok((chain, stopped))

705

}

705

}

706

707

pub fn find_snapshots(

707

pub fn find_snapshots(

708

&self,

708

&self,

709

start_rev: UncheckedRevision,

709

start_rev: UncheckedRevision,

710

end_rev: UncheckedRevision,

710

end_rev: UncheckedRevision,

711

cache: &mut impl SnapshotsCache,

711

cache: &mut impl SnapshotsCache,

712

) -> Result<(), RevlogError> {

712

) -> Result<(), RevlogError> {

713

let mut start_rev = start_rev.0;

713

let mut start_rev = start_rev.0;

714

let mut end_rev = end_rev.0;

714

let mut end_rev = end_rev.0;

715

end_rev += 1;

715

end_rev += 1;

716

let len = self.len().try_into().unwrap();

716

let len = self.len().try_into().unwrap();

717

if end_rev > len {

717

if end_rev > len {

718

end_rev = len;

718

end_rev = len;

719

}

719

}

720

if start_rev < 0 {

720

if start_rev < 0 {

721

start_rev = 0;

721

start_rev = 0;

722

}

722

}

723

for rev in start_rev..end_rev {

723

for rev in start_rev..end_rev {

724

if !self.is_snapshot_unchecked(Revision(rev))? {

724

if !self.is_snapshot_unchecked(Revision(rev))? {

725

continue;

725

continue;

726

}

726

}

727

let mut base = self

727

let mut base = self

728

.get_entry(Revision(rev))

728

.get_entry(Revision(rev))

729

.unwrap()

729

.unwrap()

730

.base_revision_or_base_of_delta_chain();

730

.base_revision_or_base_of_delta_chain();

731

if base.0 == rev {

731

if base.0 == rev {

732

base = NULL_REVISION.into();

732

base = NULL_REVISION.into();

733

}

733

}

734

cache.insert_for(base.0, rev)?;

734

cache.insert_for(base.0, rev)?;

735

}

735

}

736

Ok(())

736

Ok(())

737

}

737

}

738

739

fn clear_head_revs(&self) {

739

fn clear_head_revs(&self) {

740

self.head_revs

740

self.head_revs

741

.write()

741

.write()

742

.expect("RwLock on Index.head_revs should not be poisoined")

742

.expect("RwLock on Index.head_revs should not be poisoined")

743

.0

743

.0

744

.clear()

744

.clear()

745

}

745

}

746

747

/// TODO move this to the trait probably, along with other things

747

/// TODO move this to the trait probably, along with other things

748

pub fn append(

748

pub fn append(

749

&mut self,

749

&mut self,

750

revision_data: RevisionDataParams,

750

revision_data: RevisionDataParams,

751

) -> Result<(), RevlogError> {

751

) -> Result<(), RevlogError> {

752

revision_data.validate()?;

752

revision_data.validate()?;

753

let entry_v1 = revision_data.into_v1();

753

let entry_v1 = revision_data.into_v1();

754

let entry_bytes = entry_v1.as_bytes();

754

let entry_bytes = entry_v1.as_bytes();

755

if self.bytes.len() == 0 {

755

if self.bytes.len() == 0 {

756

self.bytes.first_entry[INDEX_HEADER_SIZE..].copy_from_slice(

756

self.bytes.first_entry[INDEX_HEADER_SIZE..].copy_from_slice(

757

&entry_bytes[INDEX_HEADER_SIZE..INDEX_ENTRY_SIZE],

757

&entry_bytes[INDEX_HEADER_SIZE..INDEX_ENTRY_SIZE],

758

)

758

)

759

}

759

}

760

if self.is_inline() {

760

if self.is_inline() {

761

let new_offset = self.bytes.len();

761

let new_offset = self.bytes.len();

762

if let Some(offsets) = &mut *self.get_offsets_mut() {

762

if let Some(offsets) = &mut *self.get_offsets_mut() {

763

offsets.push(new_offset)

763

offsets.push(new_offset)

764

}

764

}

765

}

765

}

766

self.bytes.added.extend(entry_bytes);

766

self.bytes.added.extend(entry_bytes);

767

self.clear_head_revs();

767

self.clear_head_revs();

768

Ok(())

768

Ok(())

769

}

769

}

770

771

pub fn pack_header(&self, header: i32) -> [u8; 4] {

771

pub fn pack_header(&self, header: i32) -> [u8; 4] {

772

header.to_be_bytes()

772

header.to_be_bytes()

773

}

773

}

774

775

pub fn remove(&mut self, rev: Revision) -> Result<(), RevlogError> {

775

pub fn remove(&mut self, rev: Revision) -> Result<(), RevlogError> {

776

let offsets = if self.is_inline() {

776

let offsets = if self.is_inline() {

777

self.get_offsets().clone()

777

self.get_offsets().clone()

778

} else {

778

} else {

779

None

779

None

780

};

780

};

781

self.bytes.remove(rev, offsets.as_deref())?;

781

self.bytes.remove(rev, offsets.as_deref())?;

782

if self.is_inline() {

782

if self.is_inline() {

783

if let Some(offsets) = &mut *self.get_offsets_mut() {

783

if let Some(offsets) = &mut *self.get_offsets_mut() {

784

offsets.truncate(rev.0 as usize)

784

offsets.truncate(rev.0 as usize)

785

}

785

}

786

}

786

}

787

self.clear_head_revs();

787

self.clear_head_revs();

788

Ok(())

788

Ok(())

789

}

789

}

790

791

pub fn clear_caches(&self) {

791

pub fn clear_caches(&self) {

792

// We need to get the 'inline' value from Python at init and use this

792

// We need to get the 'inline' value from Python at init and use this

793

// instead of offsets to determine whether we're inline since we might

793

// instead of offsets to determine whether we're inline since we might

794

// clear caches. This implies re-populating the offsets on-demand.

794

// clear caches. This implies re-populating the offsets on-demand.

795

*self

795

*self

796

.offsets

796

.offsets

797

.write()

797

.write()

798

.expect("RwLock on Index.offsets should not be poisoed") = None;

798

.expect("RwLock on Index.offsets should not be poisoed") = None;

799

self.clear_head_revs();

799

self.clear_head_revs();

800

}

800

}

801

802

/// Unchecked version of `is_snapshot`.

802

/// Unchecked version of `is_snapshot`.

803

/// Assumes the caller checked that `rev` is within a valid revision range.

803

/// Assumes the caller checked that `rev` is within a valid revision range.

804

pub fn is_snapshot_unchecked(

804

pub fn is_snapshot_unchecked(

805

&self,

805

&self,

806

mut rev: Revision,

806

mut rev: Revision,

807

) -> Result<bool, RevlogError> {

807

) -> Result<bool, RevlogError> {

808

while rev.0 >= 0 {

808

while rev.0 >= 0 {

809

let entry = self.get_entry(rev).unwrap();

809

let entry = self.get_entry(rev).unwrap();

810

let mut base = entry.base_revision_or_base_of_delta_chain().0;

810

let mut base = entry.base_revision_or_base_of_delta_chain().0;

811

if base == rev.0 {

811

if base == rev.0 {

812

base = NULL_REVISION.0;

812

base = NULL_REVISION.0;

813

}

813

}

814

if base == NULL_REVISION.0 {

814

if base == NULL_REVISION.0 {

815

return Ok(true);

815

return Ok(true);

816

}

816

}

817

let [mut p1, mut p2] = self

817

let [mut p1, mut p2] = self

818

.parents(rev)

818

.parents(rev)

819

.map_err(|_| RevlogError::InvalidRevision)?;

819

.map_err(|_| RevlogError::InvalidRevision)?;

820

while let Some(p1_entry) = self.get_entry(p1) {

820

while let Some(p1_entry) = self.get_entry(p1) {

821

if p1_entry.compressed_len() != 0 || p1.0 == 0 {

821

if p1_entry.compressed_len() != 0 || p1.0 == 0 {

822

break;

822

break;

823

}

823

}

824

let parent_base =

824

let parent_base =

825

p1_entry.base_revision_or_base_of_delta_chain();

825

p1_entry.base_revision_or_base_of_delta_chain();

826

if parent_base.0 == p1.0 {

826

if parent_base.0 == p1.0 {

827

break;

827

break;

828

}

828

}

829

p1 = self

829

p1 = self

830

.check_revision(parent_base)

830

.check_revision(parent_base)

831

.ok_or(RevlogError::InvalidRevision)?;

831

.ok_or(RevlogError::InvalidRevision)?;

832

}

832

}

833

while let Some(p2_entry) = self.get_entry(p2) {

833

while let Some(p2_entry) = self.get_entry(p2) {

834

if p2_entry.compressed_len() != 0 || p2.0 == 0 {

834

if p2_entry.compressed_len() != 0 || p2.0 == 0 {

835

break;

835

break;

836

}

836

}

837

let parent_base =

837

let parent_base =

838

p2_entry.base_revision_or_base_of_delta_chain();

838

p2_entry.base_revision_or_base_of_delta_chain();

839

if parent_base.0 == p2.0 {

839

if parent_base.0 == p2.0 {

840

break;

840

break;

841

}

841

}

842

p2 = self

842

p2 = self

843

.check_revision(parent_base)

843

.check_revision(parent_base)

844

.ok_or(RevlogError::InvalidRevision)?;

844

.ok_or(RevlogError::InvalidRevision)?;

845

}

845

}

846

if base == p1.0 || base == p2.0 {

846

if base == p1.0 || base == p2.0 {

847

return Ok(false);

847

return Ok(false);

848

}

848

}

849

rev = self

849

rev = self

850

.check_revision(base.into())

850

.check_revision(base.into())

851

.ok_or(RevlogError::InvalidRevision)?;

851

.ok_or(RevlogError::InvalidRevision)?;

852

}

852

}

853

Ok(rev == NULL_REVISION)

853

Ok(rev == NULL_REVISION)

854

}

854

}

855

856

/// Return whether the given revision is a snapshot. Returns an error if

856

/// Return whether the given revision is a snapshot. Returns an error if

857

/// `rev` is not within a valid revision range.

857

/// `rev` is not within a valid revision range.

858

pub fn is_snapshot(

858

pub fn is_snapshot(

859

&self,

859

&self,

860

rev: UncheckedRevision,

860

rev: UncheckedRevision,

861

) -> Result<bool, RevlogError> {

861

) -> Result<bool, RevlogError> {

862

let rev = self

862

let rev = self

863

.check_revision(rev)

863

.check_revision(rev)

864

.ok_or_else(|| RevlogError::corrupted("test"))?;

864

.ok_or_else(|| RevlogError::corrupted("test"))?;

865

self.is_snapshot_unchecked(rev)

865

self.is_snapshot_unchecked(rev)

866

}

866

}

867

868

/// Slice revs to reduce the amount of unrelated data to be read from disk.

868

/// Slice revs to reduce the amount of unrelated data to be read from disk.

869

///

869

///

870

/// The index is sliced into groups that should be read in one time.

870

/// The index is sliced into groups that should be read in one time.

871

///

871

///

872

/// The initial chunk is sliced until the overall density

872

/// The initial chunk is sliced until the overall density

873

/// (payload/chunks-span ratio) is above `target_density`.

873

/// (payload/chunks-span ratio) is above `target_density`.

874

/// No gap smaller than `min_gap_size` is skipped.

874

/// No gap smaller than `min_gap_size` is skipped.

875

pub fn slice_chunk_to_density(

875

pub fn slice_chunk_to_density(

876

&self,

876

&self,

877

revs: &[Revision],

877

revs: &[Revision],

878

target_density: f64,

878

target_density: f64,

879

min_gap_size: usize,

879

min_gap_size: usize,

880

) -> Vec<Vec<Revision>> {

880

) -> Vec<Vec<Revision>> {

881

if revs.is_empty() {

881

if revs.is_empty() {

882

return vec![];

882

return vec![];

883

}

883

}

884

if revs.len() == 1 {

884

if revs.len() == 1 {

885

return vec![revs.to_owned()];

885

return vec![revs.to_owned()];

886

}

886

}

887

let delta_chain_span = self.segment_span(revs);

887

let delta_chain_span = self.segment_span(revs);

888

if delta_chain_span < min_gap_size {

888

if delta_chain_span < min_gap_size {

889

return vec![revs.to_owned()];

889

return vec![revs.to_owned()];

890

}

890

}

891

let entries: Vec<_> = revs

891

let entries: Vec<_> = revs

892

.iter()

892

.iter()

893

.map(|r| {

893

.map(|r| {

894

(*r, self.get_entry(*r).unwrap_or_else(|| self.null_entry()))

894

(*r, self.get_entry(*r).unwrap_or_else(|| self.null_entry()))

895

})

895

})

896

.collect();

896

.collect();

897

898

let mut read_data = delta_chain_span;

898

let mut read_data = delta_chain_span;

899

let chain_payload: u32 =

899

let chain_payload: u32 =

900

entries.iter().map(|(_r, e)| e.compressed_len()).sum();

900

entries.iter().map(|(_r, e)| e.compressed_len()).sum();

901

let mut density = if delta_chain_span > 0 {

901

let mut density = if delta_chain_span > 0 {

902

chain_payload as f64 / delta_chain_span as f64

902

chain_payload as f64 / delta_chain_span as f64

903

} else {

903

} else {

904

1.0

904

1.0

905

};

905

};

906

907

if density >= target_density {

907

if density >= target_density {

908

return vec![revs.to_owned()];

908

return vec![revs.to_owned()];

909

}

909

}

910

911

// Store the gaps in a heap to have them sorted by decreasing size

911

// Store the gaps in a heap to have them sorted by decreasing size

912

let mut gaps = Vec::new();

912

let mut gaps = Vec::new();

913

let mut previous_end = None;

913

let mut previous_end = None;

914

915

for (i, (_rev, entry)) in entries.iter().enumerate() {

915

for (i, (_rev, entry)) in entries.iter().enumerate() {

916

let start = entry.c_start() as usize;

916

let start = entry.c_start() as usize;

917

let length = entry.compressed_len();

917

let length = entry.compressed_len();

918

919

// Skip empty revisions to form larger holes

919

// Skip empty revisions to form larger holes

920

if length == 0 {

920

if length == 0 {

921

continue;

921

continue;

922

}

922

}

923

924

if let Some(end) = previous_end {

924

if let Some(end) = previous_end {

925

let gap_size = start - end;

925

let gap_size = start - end;

926

// Only consider holes that are large enough

926

// Only consider holes that are large enough

927

if gap_size > min_gap_size {

927

if gap_size > min_gap_size {

928

gaps.push((gap_size, i));

928

gaps.push((gap_size, i));

929

}

929

}

930

}

930

}

931

previous_end = Some(start + length as usize);

931

previous_end = Some(start + length as usize);

932

}

932

}

933

if gaps.is_empty() {

933

if gaps.is_empty() {

934

return vec![revs.to_owned()];

934

return vec![revs.to_owned()];

935

}

935

}

936

// sort the gaps to pop them from largest to small

936

// sort the gaps to pop them from largest to small

937

gaps.sort_unstable();

937

gaps.sort_unstable();

938

939

// Collect the indices of the largest holes until

939

// Collect the indices of the largest holes until

940

// the density is acceptable

940

// the density is acceptable

941

let mut selected = vec![];

941

let mut selected = vec![];

942

while let Some((gap_size, gap_id)) = gaps.pop() {

942

while let Some((gap_size, gap_id)) = gaps.pop() {

943

if density >= target_density {

943

if density >= target_density {

944

break;

944

break;

945

}

945

}

946

selected.push(gap_id);

946

selected.push(gap_id);

947

948

// The gap sizes are stored as negatives to be sorted decreasingly

948

// The gap sizes are stored as negatives to be sorted decreasingly

949

// by the heap

949

// by the heap

950

read_data -= gap_size;

950

read_data -= gap_size;

951

density = if read_data > 0 {

951

density = if read_data > 0 {

952

chain_payload as f64 / read_data as f64

952

chain_payload as f64 / read_data as f64

953

} else {

953

} else {

954

1.0

954

1.0

955

};

955

};

956

if density >= target_density {

956

if density >= target_density {

957

break;

957

break;

958

}

958

}

959

}

959

}

960

selected.sort_unstable();

960

selected.sort_unstable();

961

selected.push(revs.len());

961

selected.push(revs.len());

962

963

// Cut the revs at collected indices

963

// Cut the revs at collected indices

964

let mut previous_idx = 0;

964

let mut previous_idx = 0;

965

let mut chunks = vec![];

965

let mut chunks = vec![];

966

for idx in selected {

966

for idx in selected {

967

let chunk = self.trim_chunk(&entries, previous_idx, idx);

967

let chunk = self.trim_chunk(&entries, previous_idx, idx);

968

if !chunk.is_empty() {

968

if !chunk.is_empty() {

969

chunks.push(chunk.iter().map(|(rev, _entry)| *rev).collect());

969

chunks.push(chunk.iter().map(|(rev, _entry)| *rev).collect());

970

}

970

}

971

previous_idx = idx;

971

previous_idx = idx;

972

}

972

}

973

let chunk = self.trim_chunk(&entries, previous_idx, entries.len());

973

let chunk = self.trim_chunk(&entries, previous_idx, entries.len());

974

if !chunk.is_empty() {

974

if !chunk.is_empty() {

975

chunks.push(chunk.iter().map(|(rev, _entry)| *rev).collect());

975

chunks.push(chunk.iter().map(|(rev, _entry)| *rev).collect());

976

}

976

}

977

978

chunks

978

chunks

979

}

979

}

980

981

/// Get the byte span of a segment of sorted revisions.

981

/// Get the byte span of a segment of sorted revisions.

982

///

982

///

983

/// Occurrences of [`NULL_REVISION`] are ignored at the beginning of

983

/// Occurrences of [`NULL_REVISION`] are ignored at the beginning of

984

/// the `revs` segment.

984

/// the `revs` segment.

985

///

985

///

986

/// panics:

986

/// panics:

987

/// - if `revs` is empty or only made of `NULL_REVISION`

987

/// - if `revs` is empty or only made of `NULL_REVISION`

988

/// - if cannot retrieve entry for the last or first not null element of

988

/// - if cannot retrieve entry for the last or first not null element of

989

/// `revs`.

989

/// `revs`.

990

fn segment_span(&self, revs: &[Revision]) -> usize {

990

fn segment_span(&self, revs: &[Revision]) -> usize {

991

if revs.is_empty() {

991

if revs.is_empty() {

992

return 0;

992

return 0;

993

}

993

}

994

let last_entry = &self.get_entry(revs[revs.len() - 1]).unwrap();

994

let last_entry = &self.get_entry(revs[revs.len() - 1]).unwrap();

995

let end = last_entry.c_start() + last_entry.compressed_len() as u64;

995

let end = last_entry.c_start() + last_entry.compressed_len() as u64;

996

let first_rev = revs.iter().find(|r| r.0 != NULL_REVISION.0).unwrap();

996

let first_rev = revs.iter().find(|r| r.0 != NULL_REVISION.0).unwrap();

997

let start = if first_rev.0 == 0 {

997

let start = if first_rev.0 == 0 {

998

0

998

0

999

} else {

999

} else {

1000

self.get_entry(*first_rev).unwrap().c_start()

1000

self.get_entry(*first_rev).unwrap().c_start()

1001

};

1001

};

1002

(end - start) as usize

1002

(end - start) as usize

1003

}

1003

}

1004

1005

/// Returns `&revs[startidx..endidx]` without empty trailing revs

1005

/// Returns `&revs[startidx..endidx]` without empty trailing revs

1006

fn trim_chunk<'a>(

1006

fn trim_chunk<'a>(

1007

&'a self,

1007

&'a self,

1008

revs: &'a [(Revision, IndexEntry)],

1008

revs: &'a [(Revision, IndexEntry)],

1009

start: usize,

1009

start: usize,

1010

mut end: usize,

1010

mut end: usize,

1011

) -> &'a [(Revision, IndexEntry)] {

1011

) -> &'a [(Revision, IndexEntry)] {

1012

// Trim empty revs at the end, except the very first rev of a chain

1012

// Trim empty revs at the end, except the very first rev of a chain

1013

let last_rev = revs[end - 1].0;

1013

let last_rev = revs[end - 1].0;

1014

if last_rev.0 < self.len() as BaseRevision {

1014

if last_rev.0 < self.len() as BaseRevision {

1015

while end > 1

1015

while end > 1

1016

&& end > start

1016

&& end > start

1017

&& revs[end - 1].1.compressed_len() == 0

1017

&& revs[end - 1].1.compressed_len() == 0

1018

{

1018

{

1019

end -= 1

1019

end -= 1

1020

}

1020

}

1021

}

1021

}

1022

&revs[start..end]

1022

&revs[start..end]

1023

}

1023

}

1024

1025

/// Computes the set of revisions for each non-public phase from `roots`,

1025

/// Computes the set of revisions for each non-public phase from `roots`,

1026

/// which are the last known roots for each non-public phase.

1026

/// which are the last known roots for each non-public phase.

1027

pub fn compute_phases_map_sets(

1027

pub fn compute_phases_map_sets(

1028

&self,

1028

&self,

1029

roots: HashMap<Phase, Vec<Revision>>,

1029

roots: HashMap<Phase, Vec<Revision>>,

1030

) -> Result<(usize, RootsPerPhase), GraphError> {

1030

) -> Result<(usize, RootsPerPhase), GraphError> {

1031

let mut phases = vec![Phase::Public; self.len()];

1031

let mut phases = vec![Phase::Public; self.len()];

1032

let mut min_phase_rev = NULL_REVISION;

1032

let mut min_phase_rev = NULL_REVISION;

1033

1034

for phase in Phase::non_public_phases() {

1034

for phase in Phase::non_public_phases() {

1035

if let Some(phase_roots) = roots.get(phase) {

1035

if let Some(phase_roots) = roots.get(phase) {

1036

let min_rev =

1036

let min_rev =

1037

self.add_roots_get_min(phase_roots, &mut phases, *phase);

1037

self.add_roots_get_min(phase_roots, &mut phases, *phase);

1038

if min_rev != NULL_REVISION

1038

if min_rev != NULL_REVISION

1039

&& (min_phase_rev == NULL_REVISION

1039

&& (min_phase_rev == NULL_REVISION

1040

|| min_rev < min_phase_rev)

1040

|| min_rev < min_phase_rev)

1041

{

1041

{

1042

min_phase_rev = min_rev;

1042

min_phase_rev = min_rev;

1043

}

1043

}

1044

} else {

1044

} else {

1045

continue;

1045

continue;

1046

};

1046

};

1047

}

1047

}

1048

let mut phase_sets: RootsPerPhase = Default::default();

1048

let mut phase_sets: RootsPerPhase = Default::default();

1049

1050

if min_phase_rev == NULL_REVISION {

1050

if min_phase_rev == NULL_REVISION {

1051

min_phase_rev = Revision(self.len() as BaseRevision);

1051

min_phase_rev = Revision(self.len() as BaseRevision);

1052

}

1052

}

1053

1054

for rev in min_phase_rev.0..self.len() as BaseRevision {

1054

for rev in min_phase_rev.0..self.len() as BaseRevision {

1055

let rev = Revision(rev);

1055

let rev = Revision(rev);

1056

let [p1, p2] = self.parents(rev)?;

1056

let [p1, p2] = self.parents(rev)?;

1057

1058

if p1.0 >= 0 && phases[p1.0 as usize] > phases[rev.0 as usize] {

1058

if p1.0 >= 0 && phases[p1.0 as usize] > phases[rev.0 as usize] {

1059

phases[rev.0 as usize] = phases[p1.0 as usize];

1059

phases[rev.0 as usize] = phases[p1.0 as usize];

1060

}

1060

}

1061

if p2.0 >= 0 && phases[p2.0 as usize] > phases[rev.0 as usize] {

1061

if p2.0 >= 0 && phases[p2.0 as usize] > phases[rev.0 as usize] {

1062

phases[rev.0 as usize] = phases[p2.0 as usize];

1062

phases[rev.0 as usize] = phases[p2.0 as usize];

1063

}

1063

}

1064

let set = match phases[rev.0 as usize] {

1064

let set = match phases[rev.0 as usize] {

1065

Phase::Public => continue,

1065

Phase::Public => continue,

1066

phase => &mut phase_sets[phase as usize - 1],

1066

phase => &mut phase_sets[phase as usize - 1],

1067

};

1067

};

1068

set.push(rev);

1068

set.push(rev);

1069

}

1069

}

1070

1071

Ok((self.len(), phase_sets))

1071

Ok((self.len(), phase_sets))

1072

}

1072

}

1073

1074

fn add_roots_get_min(

1074

fn add_roots_get_min(

1075

&self,

1075

&self,

1076

phase_roots: &[Revision],

1076

phase_roots: &[Revision],

1077

phases: &mut [Phase],

1077

phases: &mut [Phase],

1078

phase: Phase,

1078

phase: Phase,

1079

) -> Revision {

1079

) -> Revision {

1080

let mut min_rev = NULL_REVISION;

1080

let mut min_rev = NULL_REVISION;

1081

1082

for root in phase_roots {

1082

for root in phase_roots {

1083

phases[root.0 as usize] = phase;

1083

phases[root.0 as usize] = phase;

1084

if min_rev == NULL_REVISION || min_rev > *root {

1084

if min_rev == NULL_REVISION || min_rev > *root {

1085

min_rev = *root;

1085

min_rev = *root;

1086

}

1086

}

1087

}

1087

}

1088

min_rev

1088

min_rev

1089

}

1089

}

1090

1091

/// Return `(heads(::(<roots> and <roots>::<heads>)))`

1091

/// Return `(heads(::(<roots> and <roots>::<heads>)))`

1092

/// If `include_path` is `true`, return `(<roots>::<heads>)`."""

1092

/// If `include_path` is `true`, return `(<roots>::<heads>)`."""

1093

///

1093

///

1094

/// `min_root` and `roots` are unchecked since they are just used as

1094

/// `min_root` and `roots` are unchecked since they are just used as

1095

/// a bound or for comparison and don't need to represent a valid revision.

1095

/// a bound or for comparison and don't need to represent a valid revision.

1096

/// In practice, the only invalid revision passed is the working directory

1096

/// In practice, the only invalid revision passed is the working directory

1097

/// revision ([`i32::MAX`]).

1097

/// revision ([`i32::MAX`]).

1098

pub fn reachable_roots(

1098

pub fn reachable_roots(

1099

&self,

1099

&self,

1100

min_root: UncheckedRevision,

1100

min_root: UncheckedRevision,

1101

mut heads: Vec<Revision>,

1101

mut heads: Vec<Revision>,

1102

roots: HashSet<UncheckedRevision>,

1102

roots: HashSet<UncheckedRevision>,

1103

include_path: bool,

1103

include_path: bool,

1104

) -> Result<HashSet<Revision>, GraphError> {

1104

) -> Result<HashSet<Revision>, GraphError> {

1105

if roots.is_empty() {

1105

if roots.is_empty() {

1106

return Ok(HashSet::new());

1106

return Ok(HashSet::new());

1107

}

1107

}

1108

let mut reachable = HashSet::new();

1108

let mut reachable = HashSet::new();

1109

let mut seen = HashMap::new();

1109

let mut seen = HashMap::new();

1110

1111

while let Some(rev) = heads.pop() {

1111

while let Some(rev) = heads.pop() {

1112

if roots.contains(&rev.into()) {

1112

if roots.contains(&rev.into()) {

1113

reachable.insert(rev);

1113

reachable.insert(rev);

1114

if !include_path {

1114

if !include_path {

1115

continue;

1115

continue;

1116

}

1116

}

1117

}

1117

}

1118

let parents = self.parents(rev)?;

1118

let parents = self.parents(rev)?;

1119

seen.insert(rev, parents);

1119

seen.insert(rev, parents);

1120

for parent in parents {

1120

for parent in parents {

1121

if parent.0 >= min_root.0 && !seen.contains_key(&parent) {

1121

if parent.0 >= min_root.0 && !seen.contains_key(&parent) {

1122

heads.push(parent);

1122

heads.push(parent);

1123

}

1123

}

1124

}

1124

}

1125

}

1125

}

1126

if !include_path {

1126

if !include_path {

1127

return Ok(reachable);

1127

return Ok(reachable);

1128

}

1128

}

1129

let mut revs: Vec<_> = seen.keys().collect();

1129

let mut revs: Vec<_> = seen.keys().collect();

1130

revs.sort_unstable();

1130

revs.sort_unstable();

1131

for rev in revs {

1131

for rev in revs {

1132

for parent in seen[rev] {

1132

for parent in seen[rev] {

1133

if reachable.contains(&parent) {

1133

if reachable.contains(&parent) {

1134

reachable.insert(*rev);

1134

reachable.insert(*rev);

1135

}

1135

}

1136

}

1136

}

1137

}

1137

}

1138

Ok(reachable)

1138

Ok(reachable)

1139

}

1139

}

1140

1141

/// Given a (possibly overlapping) set of revs, return all the

1141

/// Given a (possibly overlapping) set of revs, return all the

1142

/// common ancestors heads: `heads(::args[0] and ::a[1] and ...)`

1142

/// common ancestors heads: `heads(::args[0] and ::a[1] and ...)`

1143

pub fn common_ancestor_heads(

1143

pub fn common_ancestor_heads(

1144

&self,

1144

&self,

1145

revisions: &[Revision],

1145

revisions: &[Revision],

1146

) -> Result<Vec<Revision>, GraphError> {

1146

) -> Result<Vec<Revision>, GraphError> {

1147

// given that revisions is expected to be small, we find this shortcut

1147

// given that revisions is expected to be small, we find this shortcut

1148

// potentially acceptable, especially given that `hg-cpython` could

1148

// potentially acceptable, especially given that `hg-cpython` could

1149

// very much bypass this, constructing a vector of unique values from

1149

// very much bypass this, constructing a vector of unique values from

1150

// the onset.

1150

// the onset.

1151

let as_set: HashSet<Revision> = revisions.iter().copied().collect();

1151

let as_set: HashSet<Revision> = revisions.iter().copied().collect();

1152

// Besides deduplicating, the C version also implements the shortcut

1152

// Besides deduplicating, the C version also implements the shortcut

1153

// for `NULL_REVISION`:

1153

// for `NULL_REVISION`:

1154

if as_set.contains(&NULL_REVISION) {

1154

if as_set.contains(&NULL_REVISION) {

1155

return Ok(vec![]);

1155

return Ok(vec![]);

1156

}

1156

}

1157

1158

let revisions: Vec<Revision> = as_set.into_iter().collect();

1158

let revisions: Vec<Revision> = as_set.into_iter().collect();

1159

1160

if revisions.len() < 8 {

1160

if revisions.len() < 8 {

1161

self.find_gca_candidates::<u8>(&revisions)

1161

self.find_gca_candidates::<u8>(&revisions)

1162

} else if revisions.len() < 64 {

1162

} else if revisions.len() < 64 {

1163

self.find_gca_candidates::<u64>(&revisions)

1163

self.find_gca_candidates::<u64>(&revisions)

1164

} else {

1164

} else {

1165

self.find_gca_candidates::<NonStaticPoisonableBitSet>(&revisions)

1165

self.find_gca_candidates::<NonStaticPoisonableBitSet>(&revisions)

1166

}

1166

}

1167

}

1167

}

1168

1169

pub fn ancestors(

1169

pub fn ancestors(

1170

&self,

1170

&self,

1171

revisions: &[Revision],

1171

revisions: &[Revision],

1172

) -> Result<Vec<Revision>, GraphError> {

1172

) -> Result<Vec<Revision>, GraphError> {

1173

self.find_deepest_revs(&self.common_ancestor_heads(revisions)?)

1173

self.find_deepest_revs(&self.common_ancestor_heads(revisions)?)

1174

}

1174

}

1175

1176

/// Given a disjoint set of revs, return all candidates for the

1176

/// Given a disjoint set of revs, return all candidates for the

1177

/// greatest common ancestor. In revset notation, this is the set

1177

/// greatest common ancestor. In revset notation, this is the set

1178

/// `heads(::a and ::b and ...)`

1178

/// `heads(::a and ::b and ...)`

1179

fn find_gca_candidates<BS: PoisonableBitSet + Clone>(

1179

fn find_gca_candidates<BS: PoisonableBitSet + Clone>(

1180

&self,

1180

&self,

1181

revs: &[Revision],

1181

revs: &[Revision],

1182

) -> Result<Vec<Revision>, GraphError> {

1182

) -> Result<Vec<Revision>, GraphError> {

1183

if revs.is_empty() {

1183

if revs.is_empty() {

1184

return Ok(vec![]);

1184

return Ok(vec![]);

1185

}

1185

}

1186

let revcount = revs.len();

1186

let revcount = revs.len();

1187

let mut candidates = vec![];

1187

let mut candidates = vec![];

1188

let max_rev = revs.iter().max().unwrap();

1188

let max_rev = revs.iter().max().unwrap();

1189

1190

let mut seen = BS::vec_of_empty(revs.len(), (max_rev.0 + 1) as usize);

1190

let mut seen = BS::vec_of_empty(revs.len(), (max_rev.0 + 1) as usize);

1191

1192

for (idx, rev) in revs.iter().enumerate() {

1192

for (idx, rev) in revs.iter().enumerate() {

1193

seen[rev.0 as usize].add(idx);

1193

seen[rev.0 as usize].add(idx);

1194

}

1194

}

1195

let mut current_rev = *max_rev;

1195

let mut current_rev = *max_rev;

1196

// Number of revisions whose inspection in the main loop

1196

// Number of revisions whose inspection in the main loop

1197

// will give a result or trigger inspection of other revisions

1197

// will give a result or trigger inspection of other revisions

1198

let mut interesting = revcount;

1198

let mut interesting = revcount;

1199

1200

// The algorithm works on a vector of bit sets, indexed by revision

1200

// The algorithm works on a vector of bit sets, indexed by revision

1201

// numbers and iterated on reverse order.

1201

// numbers and iterated on reverse order.

1202

// An entry in this vector is poisoned if and only if the corresponding

1202

// An entry in this vector is poisoned if and only if the corresponding

1203

// revision is a common, yet not maximal ancestor.

1203

// revision is a common, yet not maximal ancestor.

1204

1205

// The principle of the algorithm is as follows:

1205

// The principle of the algorithm is as follows:

1206

// For a revision `r`, when entering the loop, `seen[r]` is either

1206

// For a revision `r`, when entering the loop, `seen[r]` is either

1207

// poisoned or the sub set of `revs` of which `r` is an ancestor.

1207

// poisoned or the sub set of `revs` of which `r` is an ancestor.

1208

// In this sub set is full, then `r` is a solution and its parents

1208

// In this sub set is full, then `r` is a solution and its parents

1209

// have to be poisoned.

1209

// have to be poisoned.

1210

//

1210

//

1211

// At each iteration, the bit sets of the parents are updated by

1211

// At each iteration, the bit sets of the parents are updated by

1212

// union with `seen[r]`.

1212

// union with `seen[r]`.

1213

// As we walk the index from the end, we are sure we have encountered

1213

// As we walk the index from the end, we are sure we have encountered

1214

// all children of `r` before `r`, hence we know that `seen[r]` is

1214

// all children of `r` before `r`, hence we know that `seen[r]` is

1215

// fully computed.

1215

// fully computed.

1216

//

1216

//

1217

// On top of that there are several optimizations that make reading

1217

// On top of that there are several optimizations that make reading

1218

// less obvious than the comment above:

1218

// less obvious than the comment above:

1219

// - The `interesting` counter allows to break early

1219

// - The `interesting` counter allows to break early

1220

// - The loop starts from `max(revs)`

1220

// - The loop starts from `max(revs)`

1221

// - Early return in case it is detected that one of the incoming revs

1221

// - Early return in case it is detected that one of the incoming revs

1222

// is a common ancestor of all of them.

1222

// is a common ancestor of all of them.

1223

while current_rev.0 >= 0 && interesting > 0 {

1223

while current_rev.0 >= 0 && interesting > 0 {

1224

let current_seen = seen[current_rev.0 as usize].clone();

1224

let current_seen = seen[current_rev.0 as usize].clone();

1225

1226

if current_seen.is_empty() {

1226

if current_seen.is_empty() {

1227

current_rev = Revision(current_rev.0 - 1);

1227

current_rev = Revision(current_rev.0 - 1);

1228

continue;

1228

continue;

1229

}

1229

}

1230

let mut poison = current_seen.is_poisoned();

1230

let mut poison = current_seen.is_poisoned();

1231

if !poison {

1231

if !poison {

1232

interesting -= 1;

1232

interesting -= 1;

1233

if current_seen.is_full_range(revcount) {

1233

if current_seen.is_full_range(revcount) {

1234

candidates.push(current_rev);

1234

candidates.push(current_rev);

1235

poison = true;

1235

poison = true;

1236

1237

// Being a common ancestor, if `current_rev` is among

1237

// Being a common ancestor, if `current_rev` is among

1238

// the input revisions, it is *the* answer.

1238

// the input revisions, it is *the* answer.

1239

for rev in revs {

1239

for rev in revs {

1240

if *rev == current_rev {

1240

if *rev == current_rev {

1241

return Ok(candidates);

1241

return Ok(candidates);

1242

}

1242

}

1243

}

1243

}

1244

}

1244

}

1245

}

1245

}

1246

for parent in self.parents(current_rev)? {

1246

for parent in self.parents(current_rev)? {

1247

if parent == NULL_REVISION {

1247

if parent == NULL_REVISION {

1248

continue;

1248

continue;

1249

}

1249

}

1250

let parent_seen = &mut seen[parent.0 as usize];

1250

let parent_seen = &mut seen[parent.0 as usize];

1251

if poison {

1251

if poison {

1252

// this block is logically equivalent to poisoning parent

1252

// this block is logically equivalent to poisoning parent

1253

// and counting it as non interesting if it

1253

// and counting it as non interesting if it

1254

// has been seen before (hence counted then as interesting)

1254

// has been seen before (hence counted then as interesting)

1255

if !parent_seen.is_empty() && !parent_seen.is_poisoned() {

1255

if !parent_seen.is_empty() && !parent_seen.is_poisoned() {

1256

interesting -= 1;

1256

interesting -= 1;

1257

}

1257

}

1258

parent_seen.poison();

1258

parent_seen.poison();

1259

} else {

1259

} else {

1260

if parent_seen.is_empty() {

1260

if parent_seen.is_empty() {

1261

interesting += 1;

1261

interesting += 1;

1262

}

1262

}

1263

parent_seen.union(&current_seen);

1263

parent_seen.union(&current_seen);

1264

}

1264

}

1265

}

1265

}

1266

1267

current_rev = Revision(current_rev.0 - 1);

1267

current_rev = Revision(current_rev.0 - 1);

1268

}

1268

}

1269

1270

Ok(candidates)

1270

Ok(candidates)

1271

}

1271

}

1272

1273

/// Given a disjoint set of revs, return the subset with the longest path

1273

/// Given a disjoint set of revs, return the subset with the longest path

1274

/// to the root.

1274

/// to the root.

1275

fn find_deepest_revs(

1275

fn find_deepest_revs(

1276

&self,

1276

&self,

1277

revs: &[Revision],

1277

revs: &[Revision],

1278

) -> Result<Vec<Revision>, GraphError> {

1278

) -> Result<Vec<Revision>, GraphError> {

1279

// TODO replace this all with just comparing rank?

1279

// TODO replace this all with just comparing rank?

1280

// Also, the original implementations in C/Python are cryptic, not

1280

// Also, the original implementations in C/Python are cryptic, not

1281

// even sure we actually need this?

1281

// even sure we actually need this?

1282

if revs.len() <= 1 {

1282

if revs.len() <= 1 {

1283

return Ok(revs.to_owned());

1283

return Ok(revs.to_owned());

1284

}

1284

}

1285

let max_rev = revs.iter().max().unwrap().0;

1285

let max_rev = revs.iter().max().unwrap().0;

1286

let mut interesting = HashMap::new();

1286

let mut interesting = HashMap::new();

1287

let mut seen = vec![0; max_rev as usize + 1];

1287

let mut seen = vec![0; max_rev as usize + 1];

1288

let mut depth = vec![0; max_rev as usize + 1];

1288

let mut depth = vec![0; max_rev as usize + 1];

1289

let mut mapping = vec![];

1289

let mut mapping = vec![];

1290

let mut revs = revs.to_owned();

1290

let mut revs = revs.to_owned();

1291

revs.sort_unstable();

1291

revs.sort_unstable();

1292

1293

for (idx, rev) in revs.iter().enumerate() {

1293

for (idx, rev) in revs.iter().enumerate() {

1294

depth[rev.0 as usize] = 1;

1294

depth[rev.0 as usize] = 1;

1295

let shift = 1 << idx;

1295

let shift = 1 << idx;

1296

seen[rev.0 as usize] = shift;

1296

seen[rev.0 as usize] = shift;

1297

interesting.insert(shift, 1);

1297

interesting.insert(shift, 1);

1298

mapping.push((shift, *rev));

1298

mapping.push((shift, *rev));

1299

}

1299

}

1300

1301

let mut current_rev = Revision(max_rev);

1301

let mut current_rev = Revision(max_rev);

1302

while current_rev.0 >= 0 && interesting.len() > 1 {

1302

while current_rev.0 >= 0 && interesting.len() > 1 {

1303

let current_depth = depth[current_rev.0 as usize];

1303

let current_depth = depth[current_rev.0 as usize];

1304

if current_depth == 0 {

1304

if current_depth == 0 {

1305

current_rev = Revision(current_rev.0 - 1);

1305

current_rev = Revision(current_rev.0 - 1);

1306

continue;

1306

continue;

1307

}

1307

}

1308

1309

let current_seen = seen[current_rev.0 as usize];

1309

let current_seen = seen[current_rev.0 as usize];

1310

for parent in self.parents(current_rev)? {

1310

for parent in self.parents(current_rev)? {

1311

if parent == NULL_REVISION {

1311

if parent == NULL_REVISION {

1312

continue;

1312

continue;

1313

}

1313

}

1314

let parent_seen = seen[parent.0 as usize];

1314

let parent_seen = seen[parent.0 as usize];

1315

let parent_depth = depth[parent.0 as usize];

1315

let parent_depth = depth[parent.0 as usize];

1316

if parent_depth <= current_depth {

1316

if parent_depth <= current_depth {

1317

depth[parent.0 as usize] = current_depth + 1;

1317

depth[parent.0 as usize] = current_depth + 1;

1318

if parent_seen != current_seen {

1318

if parent_seen != current_seen {

1319

*interesting.get_mut(&current_seen).unwrap() += 1;

1319

*interesting.get_mut(&current_seen).unwrap() += 1;

1320

seen[parent.0 as usize] = current_seen;

1320

seen[parent.0 as usize] = current_seen;

1321

if parent_seen != 0 {

1321

if parent_seen != 0 {

1322

let parent_interesting =

1322

let parent_interesting =

1323

interesting.get_mut(&parent_seen).unwrap();

1323

interesting.get_mut(&parent_seen).unwrap();

1324

*parent_interesting -= 1;

1324

*parent_interesting -= 1;

1325

if *parent_interesting == 0 {

1325

if *parent_interesting == 0 {

1326

interesting.remove(&parent_seen);

1326

interesting.remove(&parent_seen);

1327

}

1327

}

1328

}

1328

}

1329

}

1329

}

1330

} else if current_depth == parent_depth - 1 {

1330

} else if current_depth == parent_depth - 1 {

1331

let either_seen = parent_seen | current_seen;

1331

let either_seen = parent_seen | current_seen;

1332

if either_seen == parent_seen {

1332

if either_seen == parent_seen {

1333

continue;

1333

continue;

1334

}

1334

}

1335

seen[parent.0 as usize] = either_seen;

1335

seen[parent.0 as usize] = either_seen;

1336

interesting

1336

interesting

1337

.entry(either_seen)

1337

.entry(either_seen)

1338

.and_modify(|v| *v += 1)

1338

.and_modify(|v| *v += 1)

1339

.or_insert(1);

1339

.or_insert(1);

1340

*interesting.get_mut(&parent_seen).unwrap() -= 1;

1340

*interesting.get_mut(&parent_seen).unwrap() -= 1;

1341

if interesting[&parent_seen] == 0 {

1341

if interesting[&parent_seen] == 0 {

1342

interesting.remove(&parent_seen);

1342

interesting.remove(&parent_seen);

1343

}

1343

}

1344

}

1344

}

1345

}

1345

}

1346

*interesting.get_mut(&current_seen).unwrap() -= 1;

1346

*interesting.get_mut(&current_seen).unwrap() -= 1;

1347

if interesting[&current_seen] == 0 {

1347

if interesting[&current_seen] == 0 {

1348

interesting.remove(&current_seen);

1348

interesting.remove(&current_seen);

1349

}

1349

}

1350

1351

current_rev = Revision(current_rev.0 - 1);

1351

current_rev = Revision(current_rev.0 - 1);

1352

}

1352

}

1353

1354

if interesting.len() != 1 {

1354

if interesting.len() != 1 {

1355

return Ok(vec![]);

1355

return Ok(vec![]);

1356

}

1356

}

1357

let mask = interesting.keys().next().unwrap();

1357

let mask = interesting.keys().next().unwrap();

1358

1359

Ok(mapping

1359

Ok(mapping

1360

.into_iter()

1360

.into_iter()

1361

.filter_map(|(shift, rev)| {

1361

.filter_map(|(shift, rev)| {

1362

if (mask & shift) != 0 {

1362

if (mask & shift) != 0 {

1363

return Some(rev);

1363

return Some(rev);

1364

}

1364

}

1365

None

1365

None

1366

})

1366

})

1367

.collect())

1367

.collect())

1368

}

1368

}

1369

}

1369

}

1370

1371

/// The kind of functionality needed by find_gca_candidates

1371

/// The kind of functionality needed by find_gca_candidates

1372

///

1372

///

1373

/// This is a bit mask which can be declared to be "poisoned", which callers

1373

/// This is a bit mask which can be declared to be "poisoned", which callers

1374

/// interpret to break out of some loops.

1374

/// interpret to break out of some loops.

1375

///

1375

///

1376

/// The maximum capacity of the bit mask is up to the actual implementation

1376

/// The maximum capacity of the bit mask is up to the actual implementation

1377

trait PoisonableBitSet: Sized + PartialEq {

1377

trait PoisonableBitSet: Sized + PartialEq {

1378

/// Return a vector of exactly n elements, initialized to be empty.

1378

/// Return a vector of exactly n elements, initialized to be empty.

1379

///

1379

///

1380

/// Optimization can vastly depend on implementation. Those being `Copy`

1380

/// Optimization can vastly depend on implementation. Those being `Copy`

1381

/// and having constant capacity typically can have a very simple

1381

/// and having constant capacity typically can have a very simple

1382

/// implementation.

1382

/// implementation.

1383

fn vec_of_empty(sets_size: usize, vec_len: usize) -> Vec<Self>;

1383

fn vec_of_empty(sets_size: usize, vec_len: usize) -> Vec<Self>;

1384

1385

/// The size of the bit mask in memory

1385

/// The size of the bit mask in memory

1386

#[allow(unused)]

1386

#[allow(unused)]

1387

fn size(&self) -> usize;

1387

fn size(&self) -> usize;

1388

1389

/// The number of elements that can be represented in the set.

1389

/// The number of elements that can be represented in the set.

1390

///

1390

///

1391

/// Another way to put it is that it is the highest integer `C` such that

1391

/// Another way to put it is that it is the highest integer `C` such that

1392

/// the set is guaranteed to always be a subset of the integer range

1392

/// the set is guaranteed to always be a subset of the integer range

1393

/// `[0, C)`

1393

/// `[0, C)`

1394

#[allow(unused)]

1394

#[allow(unused)]

1395

fn capacity(&self) -> usize;

1395

fn capacity(&self) -> usize;

1396

1397

/// Declare `n` to belong to the set

1397

/// Declare `n` to belong to the set

1398

fn add(&mut self, n: usize);

1398

fn add(&mut self, n: usize);

1399

1400

/// Declare `n` not to belong to the set

1400

/// Declare `n` not to belong to the set

1401

#[allow(unused)]

1401

#[allow(unused)]

1402

fn discard(&mut self, n: usize);

1402

fn discard(&mut self, n: usize);

1403

1404

/// Replace this bit set by its union with other

1404

/// Replace this bit set by its union with other

1405

fn union(&mut self, other: &Self);

1405

fn union(&mut self, other: &Self);

1406

1407

/// Poison the bit set

1407

/// Poison the bit set

1408

///

1408

///

1409

/// Interpretation up to the caller

1409

/// Interpretation up to the caller

1410

fn poison(&mut self);

1410

fn poison(&mut self);

1411

1412

/// Is the bit set poisoned?

1412

/// Is the bit set poisoned?

1413

///

1413

///

1414

/// Interpretation is up to the caller

1414

/// Interpretation is up to the caller

1415

fn is_poisoned(&self) -> bool;

1415

fn is_poisoned(&self) -> bool;

1416

1417

/// Is the bit set empty?

1417

/// Is the bit set empty?

1418

fn is_empty(&self) -> bool;

1418

fn is_empty(&self) -> bool;

1419

1420

/// return `true` if and only if the bit is the full range `[0, n)`

1420

/// return `true` if and only if the bit is the full range `[0, n)`

1421

/// of integers

1421

/// of integers

1422

fn is_full_range(&self, n: usize) -> bool;

1422

fn is_full_range(&self, n: usize) -> bool;

1423

}

1423

}

1424

1425

const U64_POISON: u64 = 1 << 63;

1425

const U64_POISON: u64 = 1 << 63;

1426

const U8_POISON: u8 = 1 << 7;

1426

const U8_POISON: u8 = 1 << 7;

1427

1428

impl PoisonableBitSet for u64 {

1428

impl PoisonableBitSet for u64 {

1429

fn vec_of_empty(_sets_size: usize, vec_len: usize) -> Vec<Self> {

1429

fn vec_of_empty(_sets_size: usize, vec_len: usize) -> Vec<Self> {

1430

vec![0u64; vec_len]

1430

vec![0u64; vec_len]

1431

}

1431

}

1432

1433

fn size(&self) -> usize {

1433

fn size(&self) -> usize {

1434

8

1434

8

1435

}

1435

}

1436

1437

fn capacity(&self) -> usize {

1437

fn capacity(&self) -> usize {

1438

63

1438

63

1439

}

1439

}

1440

1441

fn add(&mut self, n: usize) {

1441

fn add(&mut self, n: usize) {

1442

(*self) |= 1u64 << n;

1442

(*self) |= 1u64 << n;

1443

}

1443

}

1444

1445

fn discard(&mut self, n: usize) {

1445

fn discard(&mut self, n: usize) {

1446

(*self) &= u64::MAX - (1u64 << n);

1446

(*self) &= u64::MAX - (1u64 << n);

1447

}

1447

}

1448

1449

fn union(&mut self, other: &Self) {

1449

fn union(&mut self, other: &Self) {

1450

if *self != *other {

1450

if *self != *other {

1451

(*self) |= *other;

1451

(*self) |= *other;

1452

}

1452

}

1453

}

1453

}

1454

1455

fn is_full_range(&self, n: usize) -> bool {

1455

fn is_full_range(&self, n: usize) -> bool {

1456

*self + 1 == (1u64 << n)

1456

*self + 1 == (1u64 << n)

1457

}

1457

}

1458

1459

fn is_empty(&self) -> bool {

1459

fn is_empty(&self) -> bool {

1460

*self == 0

1460

*self == 0

1461

}

1461

}

1462

1463

fn poison(&mut self) {

1463

fn poison(&mut self) {

1464

*self = U64_POISON;

1464

*self = U64_POISON;

1465

}

1465

}

1466

1467

fn is_poisoned(&self) -> bool {

1467

fn is_poisoned(&self) -> bool {

1468

// equality comparison would be tempting but would not resist

1468

// equality comparison would be tempting but would not resist

1469

// operations after poisoning (even if these should be bogus).

1469

// operations after poisoning (even if these should be bogus).

1470

*self >= U64_POISON

1470

*self >= U64_POISON

1471

}

1471

}

1472

}

1472

}

1473

1474

impl PoisonableBitSet for u8 {

1474

impl PoisonableBitSet for u8 {

1475

fn vec_of_empty(_sets_size: usize, vec_len: usize) -> Vec<Self> {

1475

fn vec_of_empty(_sets_size: usize, vec_len: usize) -> Vec<Self> {

1476

vec![0; vec_len]

1476

vec![0; vec_len]

1477

}

1477

}

1478

1479

fn size(&self) -> usize {

1479

fn size(&self) -> usize {

1480

1

1480

1

1481

}

1481

}

1482

1483

fn capacity(&self) -> usize {

1483

fn capacity(&self) -> usize {

1484

7

1484

7

1485

}

1485

}

1486

1487

fn add(&mut self, n: usize) {

1487

fn add(&mut self, n: usize) {

1488

(*self) |= 1 << n;

1488

(*self) |= 1 << n;

1489

}

1489

}

1490

1491

fn discard(&mut self, n: usize) {

1491

fn discard(&mut self, n: usize) {

1492

(*self) &= u8::MAX - (1 << n);

1492

(*self) &= u8::MAX - (1 << n);

1493

}

1493

}

1494

1495

fn union(&mut self, other: &Self) {

1495

fn union(&mut self, other: &Self) {

1496

if *self != *other {

1496

if *self != *other {

1497

(*self) |= *other;

1497

(*self) |= *other;

1498

}

1498

}

1499

}

1499

}

1500

1501

fn is_full_range(&self, n: usize) -> bool {

1501

fn is_full_range(&self, n: usize) -> bool {

1502

*self + 1 == (1 << n)

1502

*self + 1 == (1 << n)

1503

}

1503

}

1504

1505

fn is_empty(&self) -> bool {

1505

fn is_empty(&self) -> bool {

1506

*self == 0

1506

*self == 0

1507

}

1507

}

1508

1509

fn poison(&mut self) {

1509

fn poison(&mut self) {

1510

*self = U8_POISON;

1510

*self = U8_POISON;

1511

}

1511

}

1512

1513

fn is_poisoned(&self) -> bool {

1513

fn is_poisoned(&self) -> bool {

1514

// equality comparison would be tempting but would not resist

1514

// equality comparison would be tempting but would not resist

1515

// operations after poisoning (even if these should be bogus).

1515

// operations after poisoning (even if these should be bogus).

1516

*self >= U8_POISON

1516

*self >= U8_POISON

1517

}

1517

}

1518

}

1518

}

1519

1520

/// A poisonable bit set whose capacity is not known at compile time but

1520

/// A poisonable bit set whose capacity is not known at compile time but

1521

/// is constant after initial construction

1521

/// is constant after initial construction

1522

///

1522

///

1523

/// This can be way further optimized if performance assessments (speed

1523

/// This can be way further optimized if performance assessments (speed

1524

/// and/or RAM) require it.

1524

/// and/or RAM) require it.

1525

/// As far as RAM is concerned, for large vectors of these, the main problem

1525

/// As far as RAM is concerned, for large vectors of these, the main problem

1526

/// would be the repetition of set_size in each item. We would need a trait

1526

/// would be the repetition of set_size in each item. We would need a trait

1527

/// to abstract over the idea of a vector of such bit sets to do better.

1527

/// to abstract over the idea of a vector of such bit sets to do better.

1528

#[derive(Clone, PartialEq)]

1528

#[derive(Clone, PartialEq)]

1529

struct NonStaticPoisonableBitSet {

1529

struct NonStaticPoisonableBitSet {

1530

set_size: usize,

1530

set_size: usize,

1531

bit_set: Vec<u64>,

1531

bit_set: Vec<u64>,

1532

}

1532

}

1533

1534

/// Number of `u64` needed for a [`NonStaticPoisonableBitSet`] of given size

1534

/// Number of `u64` needed for a [`NonStaticPoisonableBitSet`] of given size

1535

fn non_static_poisonable_inner_len(set_size: usize) -> usize {

1535

fn non_static_poisonable_inner_len(set_size: usize) -> usize {

1536

1 + (set_size + 1) / 64

1536

1 + (set_size + 1) / 64

1537

}

1537

}

1538

1539

impl NonStaticPoisonableBitSet {

1539

impl NonStaticPoisonableBitSet {

1540

/// The index of the sub-bit set for the given n, and the index inside

1540

/// The index of the sub-bit set for the given n, and the index inside

1541

/// the latter

1541

/// the latter

1542

fn index(&self, n: usize) -> (usize, usize) {

1542

fn index(&self, n: usize) -> (usize, usize) {

1543

(n / 64, n % 64)

1543

(n / 64, n % 64)

1544

}

1544

}

1545

}

1545

}

1546

1547

/// Mock implementation to ensure that the trait makes sense

1547

/// Mock implementation to ensure that the trait makes sense

1548

impl PoisonableBitSet for NonStaticPoisonableBitSet {

1548

impl PoisonableBitSet for NonStaticPoisonableBitSet {

1549

fn vec_of_empty(set_size: usize, vec_len: usize) -> Vec<Self> {

1549

fn vec_of_empty(set_size: usize, vec_len: usize) -> Vec<Self> {

1550

let tmpl = Self {

1550

let tmpl = Self {

1551

set_size,

1551

set_size,

1552

bit_set: vec![0u64; non_static_poisonable_inner_len(set_size)],

1552

bit_set: vec![0u64; non_static_poisonable_inner_len(set_size)],

1553

};

1553

};

1554

vec![tmpl; vec_len]

1554

vec![tmpl; vec_len]

1555

}

1555

}

1556

1557

fn size(&self) -> usize {

1557

fn size(&self) -> usize {

1558

8 + self.bit_set.len() * 8

1558

8 + self.bit_set.len() * 8

1559

}

1559

}

1560

1561

fn capacity(&self) -> usize {

1561

fn capacity(&self) -> usize {

1562

self.set_size

1562

self.set_size

1563

}

1563

}

1564

1565

fn add(&mut self, n: usize) {

1565

fn add(&mut self, n: usize) {

1566

let (sub_bs, bit_pos) = self.index(n);

1566

let (sub_bs, bit_pos) = self.index(n);

1567

self.bit_set[sub_bs] |= 1 << bit_pos

1567

self.bit_set[sub_bs] |= 1 << bit_pos

1568

}

1568

}

1569

1570

fn discard(&mut self, n: usize) {

1570

fn discard(&mut self, n: usize) {

1571

let (sub_bs, bit_pos) = self.index(n);

1571

let (sub_bs, bit_pos) = self.index(n);

1572

self.bit_set[sub_bs] |= u64::MAX - (1 << bit_pos)

1572

self.bit_set[sub_bs] |= u64::MAX - (1 << bit_pos)

1573

}

1573

}

1574

1575

fn union(&mut self, other: &Self) {

1575

fn union(&mut self, other: &Self) {

1576

assert!(

1576

assert!(

1577

self.set_size == other.set_size,

1577

self.set_size == other.set_size,

1578

"Binary operations on bit sets can only be done on same size"

1578

"Binary operations on bit sets can only be done on same size"

1579

);

1579

);

1580

for i in 0..self.bit_set.len() - 1 {

1580

for i in 0..self.bit_set.len() - 1 {

1581

self.bit_set[i] |= other.bit_set[i]

1581

self.bit_set[i] |= other.bit_set[i]

1582

}

1582

}

1583

}

1583

}

1584

1585

fn is_full_range(&self, n: usize) -> bool {

1585

fn is_full_range(&self, n: usize) -> bool {

1586

let (sub_bs, bit_pos) = self.index(n);

1586

let (sub_bs, bit_pos) = self.index(n);

1587

self.bit_set[..sub_bs].iter().all(|bs| *bs == u64::MAX)

1587

self.bit_set[..sub_bs].iter().all(|bs| *bs == u64::MAX)

1588

&& self.bit_set[sub_bs] == (1 << (bit_pos + 1)) - 1

1588

&& self.bit_set[sub_bs] == (1 << (bit_pos + 1)) - 1

1589

}

1589

}

1590

1591

fn is_empty(&self) -> bool {

1591

fn is_empty(&self) -> bool {

1592

self.bit_set.iter().all(|bs| *bs == 0u64)

1592

self.bit_set.iter().all(|bs| *bs == 0u64)

1593

}

1593

}

1594

1595

fn poison(&mut self) {

1595

fn poison(&mut self) {

1596

let (sub_bs, bit_pos) = self.index(self.set_size);

1596

let (sub_bs, bit_pos) = self.index(self.set_size);

1597

self.bit_set[sub_bs] = 1 << bit_pos;

1597

self.bit_set[sub_bs] = 1 << bit_pos;

1598

}

1598

}

1599

1600

fn is_poisoned(&self) -> bool {

1600

fn is_poisoned(&self) -> bool {

1601

let (sub_bs, bit_pos) = self.index(self.set_size);

1601

let (sub_bs, bit_pos) = self.index(self.set_size);

1602

self.bit_set[sub_bs] >= 1 << bit_pos

1602

self.bit_set[sub_bs] >= 1 << bit_pos

1603

}

1603

}

1604

}

1604

}

1605

1606

/// Set of roots of all non-public phases

1606

/// Set of roots of all non-public phases

1607

pub type RootsPerPhase = [Vec<Revision>; Phase::non_public_phases().len()];

1607

pub type RootsPerPhase = [Vec<Revision>; Phase::non_public_phases().len()];

1608

1609

#[derive(Debug, Copy, Clone, PartialEq, Eq, Ord, PartialOrd, Hash)]

1609

#[derive(Debug, Copy, Clone, PartialEq, Eq, Ord, PartialOrd, Hash)]

1610

pub enum Phase {

1610

pub enum Phase {

1611

Public = 0,

1611

Public = 0,

1612

Draft = 1,

1612

Draft = 1,

1613

Secret = 2,

1613

Secret = 2,

1614

Archived = 3,

1614

Archived = 3,

1615

Internal = 4,

1615

Internal = 4,

1616

}

1616

}

1617

1618

impl TryFrom<usize> for Phase {

1618

impl TryFrom<usize> for Phase {

1619

type Error = RevlogError;

1619

type Error = RevlogError;

1620

1621

fn try_from(value: usize) -> Result<Self, Self::Error> {

1621

fn try_from(value: usize) -> Result<Self, Self::Error> {

1622

Ok(match value {

1622

Ok(match value {

1623

0 => Self::Public,

1623

0 => Self::Public,

1624

1 => Self::Draft,

1624

1 => Self::Draft,

1625

2 => Self::Secret,

1625

2 => Self::Secret,

1626

32 => Self::Archived,

1626

32 => Self::Archived,

1627

96 => Self::Internal,

1627

96 => Self::Internal,

1628

v => {

1628

v => {

1629

return Err(RevlogError::corrupted(format!(

1629

return Err(RevlogError::corrupted(format!(

1630

"invalid phase value {}",

1630

"invalid phase value {}",

1631

v

1631

v

1632

)))

1632

)))

1633

}

1633

}

1634

})

1634

})

1635

}

1635

}

1636

}

1636

}

1637

1638

impl Phase {

1638

impl Phase {

1639

pub const fn all_phases() -> &'static [Self] {

1639

pub const fn all_phases() -> &'static [Self] {

1640

&[

1640

&[

1641

Self::Public,

1641

Self::Public,

1642

Self::Draft,

1642

Self::Draft,

1643

Self::Secret,

1643

Self::Secret,

1644

Self::Archived,

1644

Self::Archived,

1645

Self::Internal,

1645

Self::Internal,

1646

]

1646

]

1647

}

1647

}

1648

pub const fn non_public_phases() -> &'static [Self] {

1648

pub const fn non_public_phases() -> &'static [Self] {

1649

&[Self::Draft, Self::Secret, Self::Archived, Self::Internal]

1649

&[Self::Draft, Self::Secret, Self::Archived, Self::Internal]

1650

}

1650

}

1651

}

1651

}

1652

1653

fn inline_scan(bytes: &[u8]) -> (usize, Vec<usize>) {

1653

fn inline_scan(bytes: &[u8]) -> (usize, Vec<usize>) {

1654

let mut offset: usize = 0;

1654

let mut offset: usize = 0;

1655

let mut offsets = Vec::new();

1655

let mut offsets = Vec::new();

1656

1657

while offset + INDEX_ENTRY_SIZE <= bytes.len() {

1657

while offset + INDEX_ENTRY_SIZE <= bytes.len() {

1658

offsets.push(offset);

1658

offsets.push(offset);

1659

let end = offset + INDEX_ENTRY_SIZE;

1659

let end = offset + INDEX_ENTRY_SIZE;

1660

let entry = IndexEntry {

1660

let entry = IndexEntry {

1661

bytes: &bytes[offset..end],

1661

bytes: &bytes[offset..end],

1662

};

1662

};

1663

1664

offset += INDEX_ENTRY_SIZE + entry.compressed_len() as usize;

1664

offset += INDEX_ENTRY_SIZE + entry.compressed_len() as usize;

1665

}

1665

}

1666

(offset, offsets)

1666

(offset, offsets)

1667

}

1667

}

1668

1669

impl super::RevlogIndex for Index {

1669

impl super::RevlogIndex for Index {

1670

fn len(&self) -> usize {

1670

fn len(&self) -> usize {

1671

self.len()

1671

self.len()

1672

}

1672

}

1673

1674

fn node(&self, rev: Revision) -> Option<&Node> {

1674

fn node(&self, rev: Revision) -> Option<&Node> {

1675

if rev == NULL_REVISION {

1675

if rev == NULL_REVISION {

1676

return Some(&NULL_NODE);

1676

return Some(&NULL_NODE);

1677

}

1677

}

1678

self.get_entry(rev).map(|entry| entry.hash())

1678

self.get_entry(rev).map(|entry| entry.hash())

1679

}

1679

}

1680

}

1680

}

1681

1682

#[derive(Debug)]

1682

#[derive(Debug)]

1683

pub struct IndexEntry<'a> {

1683

pub struct IndexEntry<'a> {

1684

bytes: &'a [u8],

1684

bytes: &'a [u8],

1685

}

1685

}

1686

1687

impl<'a> IndexEntry<'a> {

1687

impl<'a> IndexEntry<'a> {

1688

/// Return the offset of the data.

1688

/// Return the offset of the data.

1689

pub fn offset(&self) -> usize {

1689

pub fn offset(&self) -> usize {

1690

let mut bytes = [0; 8];

1690

let mut bytes = [0; 8];

1691

bytes[2..8].copy_from_slice(&self.bytes[0..=5]);

1691

bytes[2..8].copy_from_slice(&self.bytes[0..=5]);

1692

BigEndian::read_u64(&bytes[..]) as usize

1692

BigEndian::read_u64(&bytes[..]) as usize

1693

}

1693

}

1694

pub fn raw_offset(&self) -> u64 {

1694

pub fn raw_offset(&self) -> u64 {

1695

BigEndian::read_u64(&self.bytes[0..8])

1695

BigEndian::read_u64(&self.bytes[0..8])

1696

}

1696

}

1697

1698

/// Same result (except potentially for rev 0) as C `index_get_start()`

1698

/// Same result (except potentially for rev 0) as C `index_get_start()`

1699

fn c_start(&self) -> u64 {

1699

fn c_start(&self) -> u64 {

1700

self.raw_offset() >> 16

1700

self.raw_offset() >> 16

1701

}

1701

}

1702

1703

pub fn flags(&self) -> u16 {

1703

pub fn flags(&self) -> u16 {

1704

BigEndian::read_u16(&self.bytes[6..=7])

1704

BigEndian::read_u16(&self.bytes[6..=7])

1705

}

1705

}

1706

1707

/// Return the compressed length of the data.

1707

/// Return the compressed length of the data.

1708

pub fn compressed_len(&self) -> u32 {

1708

pub fn compressed_len(&self) -> u32 {

1709

BigEndian::read_u32(&self.bytes[8..=11])

1709

BigEndian::read_u32(&self.bytes[8..=11])

1710

}

1710

}

1711

1712

/// Return the uncompressed length of the data.

1712

/// Return the uncompressed length of the data.

1713

pub fn uncompressed_len(&self) -> i32 {

1713

pub fn uncompressed_len(&self) -> i32 {

1714

BigEndian::read_i32(&self.bytes[12..=15])

1714

BigEndian::read_i32(&self.bytes[12..=15])

1715

}

1715

}

1716

1717

/// Return the revision upon which the data has been derived.

1717

/// Return the revision upon which the data has been derived.

1718

pub fn base_revision_or_base_of_delta_chain(&self) -> UncheckedRevision {

1718

pub fn base_revision_or_base_of_delta_chain(&self) -> UncheckedRevision {

1719

// TODO Maybe return an Option when base_revision == rev?

1719

// TODO Maybe return an Option when base_revision == rev?

1720

// Requires to add rev to IndexEntry

1720

// Requires to add rev to IndexEntry

1721

1722

BigEndian::read_i32(&self.bytes[16..]).into()

1722

BigEndian::read_i32(&self.bytes[16..]).into()

1723

}

1723

}

1724

1725

pub fn link_revision(&self) -> UncheckedRevision {

1725

pub fn link_revision(&self) -> UncheckedRevision {

1726

BigEndian::read_i32(&self.bytes[20..]).into()

1726

BigEndian::read_i32(&self.bytes[20..]).into()

1727

}

1727

}

1728

1729

pub fn p1(&self) -> UncheckedRevision {

1729

pub fn p1(&self) -> UncheckedRevision {

1730

BigEndian::read_i32(&self.bytes[24..]).into()

1730

BigEndian::read_i32(&self.bytes[24..]).into()

1731

}

1731

}

1732

1733

pub fn p2(&self) -> UncheckedRevision {

1733

pub fn p2(&self) -> UncheckedRevision {

1734

BigEndian::read_i32(&self.bytes[28..]).into()

1734

BigEndian::read_i32(&self.bytes[28..]).into()

1735

}

1735

}

1736

1737

/// Return the hash of revision's full text.

1737

/// Return the hash of revision's full text.

1738

///

1738

///

1739

/// Currently, SHA-1 is used and only the first 20 bytes of this field

1739

/// Currently, SHA-1 is used and only the first 20 bytes of this field

1740

/// are used.

1740

/// are used.

1741

pub fn hash(&self) -> &'a Node {

1741

pub fn hash(&self) -> &'a Node {

1742

(&self.bytes[32..52]).try_into().unwrap()

1742

(&self.bytes[32..52]).try_into().unwrap()

1743

}

1743

}

1744

1745

pub fn as_bytes(&self) -> &'a [u8] {

1745

pub fn as_bytes(&self) -> &'a [u8] {

1746

self.bytes

1746

self.bytes

1747

}

1747

}

1748

}

1748

}

1749

1750

#[cfg(test)]

1750

#[cfg(test)]

1751

pub use tests::IndexEntryBuilder;

1751

pub use tests::IndexEntryBuilder;

1752

1753

#[cfg(test)]

1753

#[cfg(test)]

1754

mod tests {

1754

mod tests {

1755

use super::*;

1755

use super::*;

1756

use crate::node::NULL_NODE;

1756

use crate::node::NULL_NODE;

1757

1758

#[cfg(test)]

1758

#[cfg(test)]

1759

#[derive(Debug, Copy, Clone)]

1759

#[derive(Debug, Copy, Clone)]

1760

pub struct IndexEntryBuilder {

1760

pub struct IndexEntryBuilder {

1761

is_first: bool,

1761

is_first: bool,

1762

is_inline: bool,

1762

is_inline: bool,

1763

is_general_delta: bool,

1763

is_general_delta: bool,

1764

version: u16,

1764

version: u16,

1765

offset: usize,

1765

offset: usize,

1766

compressed_len: usize,

1766

compressed_len: usize,

1767

uncompressed_len: usize,

1767

uncompressed_len: usize,

1768

base_revision_or_base_of_delta_chain: Revision,

1768

base_revision_or_base_of_delta_chain: Revision,

1769

link_revision: Revision,

1769

link_revision: Revision,

1770

p1: Revision,

1770

p1: Revision,

1771

p2: Revision,

1771

p2: Revision,

1772

node: Node,

1772

node: Node,

1773

}

1773

}

1774

1775

#[cfg(test)]

1775

#[cfg(test)]

1776

impl IndexEntryBuilder {

1776

impl IndexEntryBuilder {

1777

#[allow(clippy::new_without_default)]

1777

#[allow(clippy::new_without_default)]

1778

pub fn new() -> Self {

1778

pub fn new() -> Self {

1779

Self {

1779

Self {

1780

is_first: false,

1780

is_first: false,

1781

is_inline: false,

1781

is_inline: false,

1782

is_general_delta: true,

1782

is_general_delta: true,

1783

version: 1,

1783

version: 1,

1784

offset: 0,

1784

offset: 0,

1785

compressed_len: 0,

1785

compressed_len: 0,

1786

uncompressed_len: 0,

1786

uncompressed_len: 0,

1787

base_revision_or_base_of_delta_chain: Revision(0),

1787

base_revision_or_base_of_delta_chain: Revision(0),

1788

link_revision: Revision(0),

1788

link_revision: Revision(0),

1789

p1: NULL_REVISION,

1789

p1: NULL_REVISION,

1790

p2: NULL_REVISION,

1790

p2: NULL_REVISION,

1791

node: NULL_NODE,

1791

node: NULL_NODE,

1792

}

1792

}

1793

}

1793

}

1794

1795

pub fn is_first(&mut self, value: bool) -> &mut Self {

1795

pub fn is_first(&mut self, value: bool) -> &mut Self {

1796

self.is_first = value;

1796

self.is_first = value;

1797

self

1797

self

1798

}

1798

}

1799

1800

pub fn with_inline(&mut self, value: bool) -> &mut Self {

1800

pub fn with_inline(&mut self, value: bool) -> &mut Self {

1801

self.is_inline = value;

1801

self.is_inline = value;

1802

self

1802

self

1803

}

1803

}

1804

1805

pub fn with_general_delta(&mut self, value: bool) -> &mut Self {

1805

pub fn with_general_delta(&mut self, value: bool) -> &mut Self {

1806

self.is_general_delta = value;

1806

self.is_general_delta = value;

1807

self

1807

self

1808

}

1808

}

1809

1810

pub fn with_version(&mut self, value: u16) -> &mut Self {

1810

pub fn with_version(&mut self, value: u16) -> &mut Self {

1811

self.version = value;

1811

self.version = value;

1812

self

1812

self

1813

}

1813

}

1814

1815

pub fn with_offset(&mut self, value: usize) -> &mut Self {

1815

pub fn with_offset(&mut self, value: usize) -> &mut Self {

1816

self.offset = value;

1816

self.offset = value;

1817

self

1817

self

1818

}

1818

}

1819

1820

pub fn with_compressed_len(&mut self, value: usize) -> &mut Self {

1820

pub fn with_compressed_len(&mut self, value: usize) -> &mut Self {

1821

self.compressed_len = value;

1821

self.compressed_len = value;

1822

self

1822

self

1823

}

1823

}

1824

1825

pub fn with_uncompressed_len(&mut self, value: usize) -> &mut Self {

1825

pub fn with_uncompressed_len(&mut self, value: usize) -> &mut Self {

1826

self.uncompressed_len = value;

1826

self.uncompressed_len = value;

1827

self

1827

self

1828

}

1828

}

1829

1830

pub fn with_base_revision_or_base_of_delta_chain(

1830

pub fn with_base_revision_or_base_of_delta_chain(

1831

&mut self,

1831

&mut self,

1832

value: Revision,

1832

value: Revision,

1833

) -> &mut Self {

1833

) -> &mut Self {

1834

self.base_revision_or_base_of_delta_chain = value;

1834

self.base_revision_or_base_of_delta_chain = value;

1835

self

1835

self

1836

}

1836

}

1837

1838

pub fn with_link_revision(&mut self, value: Revision) -> &mut Self {

1838

pub fn with_link_revision(&mut self, value: Revision) -> &mut Self {

1839

self.link_revision = value;

1839

self.link_revision = value;

1840

self

1840

self

1841

}

1841

}

1842

1843

pub fn with_p1(&mut self, value: Revision) -> &mut Self {

1843

pub fn with_p1(&mut self, value: Revision) -> &mut Self {

1844

self.p1 = value;

1844

self.p1 = value;

1845

self

1845

self

1846

}

1846

}

1847

1848

pub fn with_p2(&mut self, value: Revision) -> &mut Self {

1848

pub fn with_p2(&mut self, value: Revision) -> &mut Self {

1849

self.p2 = value;

1849

self.p2 = value;

1850

self

1850

self

1851

}

1851

}

1852

1853

pub fn with_node(&mut self, value: Node) -> &mut Self {

1853

pub fn with_node(&mut self, value: Node) -> &mut Self {

1854

self.node = value;

1854

self.node = value;

1855

self

1855

self

1856

}

1856

}

1857

1858

pub fn build(&self) -> Vec<u8> {

1858

pub fn build(&self) -> Vec<u8> {

1859

let mut bytes = Vec::with_capacity(INDEX_ENTRY_SIZE);

1859

let mut bytes = Vec::with_capacity(INDEX_ENTRY_SIZE);

1860

if self.is_first {

1860

if self.is_first {

1861

bytes.extend(match (self.is_general_delta, self.is_inline) {

1861

bytes.extend(match (self.is_general_delta, self.is_inline) {

1862

(false, false) => [0u8, 0],

1862

(false, false) => [0u8, 0],

1863

(false, true) => [0u8, 1],

1863

(false, true) => [0u8, 1],

1864

(true, false) => [0u8, 2],

1864

(true, false) => [0u8, 2],

1865

(true, true) => [0u8, 3],

1865

(true, true) => [0u8, 3],

1866

});

1866

});

1867

bytes.extend(self.version.to_be_bytes());

1867

bytes.extend(self.version.to_be_bytes());

1868

// Remaining offset bytes.

1868

// Remaining offset bytes.

1869

bytes.extend([0u8; 2]);

1869

bytes.extend([0u8; 2]);

1870

} else {

1870

} else {

1871

// Offset stored on 48 bits (6 bytes)

1871

// Offset stored on 48 bits (6 bytes)

1872

bytes.extend(&(self.offset as u64).to_be_bytes()[2..]);

1872

bytes.extend(&(self.offset as u64).to_be_bytes()[2..]);

1873

}

1873

}

1874

bytes.extend([0u8; 2]); // Revision flags.

1874

bytes.extend([0u8; 2]); // Revision flags.

1875

bytes.extend((self.compressed_len as u32).to_be_bytes());

1875

bytes.extend((self.compressed_len as u32).to_be_bytes());

1876

bytes.extend((self.uncompressed_len as u32).to_be_bytes());

1876

bytes.extend((self.uncompressed_len as u32).to_be_bytes());

1877

bytes.extend(

1877

bytes.extend(

1878

self.base_revision_or_base_of_delta_chain.0.to_be_bytes(),

1878

self.base_revision_or_base_of_delta_chain.0.to_be_bytes(),

1879

);

1879

);

1880

bytes.extend(self.link_revision.0.to_be_bytes());

1880

bytes.extend(self.link_revision.0.to_be_bytes());

1881

bytes.extend(self.p1.0.to_be_bytes());

1881

bytes.extend(self.p1.0.to_be_bytes());

1882

bytes.extend(self.p2.0.to_be_bytes());

1882

bytes.extend(self.p2.0.to_be_bytes());

1883

bytes.extend(self.node.as_bytes());

1883

bytes.extend(self.node.as_bytes());

1884

bytes.extend(vec![0u8; 12]);

1884

bytes.extend(vec![0u8; 12]);

1885

bytes

1885

bytes

1886

}

1886

}

1887

}

1887

}

1888

1889

pub fn is_inline(index_bytes: &[u8]) -> bool {

1889

pub fn is_inline(index_bytes: &[u8]) -> bool {

1890

IndexHeader::parse(index_bytes)

1890

IndexHeader::parse(index_bytes)

1891

.expect("too short")

1891

.expect("too short")

1892

.unwrap()

1892

.unwrap()

1893

.format_flags()

1893

.format_flags()

1894

.is_inline()

1894

.is_inline()

1895

}

1895

}

1896

1897

pub fn uses_generaldelta(index_bytes: &[u8]) -> bool {

1897

pub fn uses_generaldelta(index_bytes: &[u8]) -> bool {

1898

IndexHeader::parse(index_bytes)

1898

IndexHeader::parse(index_bytes)

1899

.expect("too short")

1899

.expect("too short")

1900

.unwrap()

1900

.unwrap()

1901

.format_flags()

1901

.format_flags()

1902

.uses_generaldelta()

1902

.uses_generaldelta()

1903

}

1903

}

1904

1905

pub fn get_version(index_bytes: &[u8]) -> u16 {

1905

pub fn get_version(index_bytes: &[u8]) -> u16 {

1906

IndexHeader::parse(index_bytes)

1906

IndexHeader::parse(index_bytes)

1907

.expect("too short")

1907

.expect("too short")

1908

.unwrap()

1908

.unwrap()

1909

.format_version()

1909

.format_version()

1910

}

1910

}

1911

1912

#[test]

1912

#[test]

1913

fn flags_when_no_inline_flag_test() {

1913

fn flags_when_no_inline_flag_test() {

1914

let bytes = IndexEntryBuilder::new()

1914

let bytes = IndexEntryBuilder::new()

1915

.is_first(true)

1915

.is_first(true)

1916

.with_general_delta(false)

1916

.with_general_delta(false)

1917

.with_inline(false)

1917

.with_inline(false)

1918

.build();

1918

.build();

1919

1920

assert!(!is_inline(&bytes));

1920

assert!(!is_inline(&bytes));

1921

assert!(!uses_generaldelta(&bytes));

1921

assert!(!uses_generaldelta(&bytes));

1922

}

1922

}

1923

1924

#[test]

1924

#[test]

1925

fn flags_when_inline_flag_test() {

1925

fn flags_when_inline_flag_test() {

1926

let bytes = IndexEntryBuilder::new()

1926

let bytes = IndexEntryBuilder::new()

1927

.is_first(true)

1927

.is_first(true)

1928

.with_general_delta(false)

1928

.with_general_delta(false)

1929

.with_inline(true)

1929

.with_inline(true)

1930

.build();

1930

.build();

1931

1932

assert!(is_inline(&bytes));

1932

assert!(is_inline(&bytes));

1933

assert!(!uses_generaldelta(&bytes));

1933

assert!(!uses_generaldelta(&bytes));

1934

}

1934

}

1935

1936

#[test]

1936

#[test]

1937

fn flags_when_inline_and_generaldelta_flags_test() {

1937

fn flags_when_inline_and_generaldelta_flags_test() {

1938

let bytes = IndexEntryBuilder::new()

1938

let bytes = IndexEntryBuilder::new()

1939

.is_first(true)

1939

.is_first(true)

1940

.with_general_delta(true)

1940

.with_general_delta(true)

1941

.with_inline(true)

1941

.with_inline(true)

1942

.build();

1942

.build();

1943

1944

assert!(is_inline(&bytes));

1944

assert!(is_inline(&bytes));

1945

assert!(uses_generaldelta(&bytes));

1945

assert!(uses_generaldelta(&bytes));

1946

}

1946

}

1947

1948

#[test]

1948

#[test]

1949

fn test_offset() {

1949

fn test_offset() {

1950

let bytes = IndexEntryBuilder::new().with_offset(1).build();

1950

let bytes = IndexEntryBuilder::new().with_offset(1).build();

1951

let entry = IndexEntry { bytes: &bytes };

1951

let entry = IndexEntry { bytes: &bytes };

1952

1953

assert_eq!(entry.offset(), 1)

1953

assert_eq!(entry.offset(), 1)

1954

}

1954

}

1955

1956

#[test]

1956

#[test]

1957

fn test_compressed_len() {

1957

fn test_compressed_len() {

1958

let bytes = IndexEntryBuilder::new().with_compressed_len(1).build();

1958

let bytes = IndexEntryBuilder::new().with_compressed_len(1).build();

1959

let entry = IndexEntry { bytes: &bytes };

1959

let entry = IndexEntry { bytes: &bytes };

1960

1961

assert_eq!(entry.compressed_len(), 1)

1961

assert_eq!(entry.compressed_len(), 1)

1962

}

1962

}

1963

1964

#[test]

1964

#[test]

1965

fn test_uncompressed_len() {

1965

fn test_uncompressed_len() {

1966

let bytes = IndexEntryBuilder::new().with_uncompressed_len(1).build();

1966

let bytes = IndexEntryBuilder::new().with_uncompressed_len(1).build();

1967

let entry = IndexEntry { bytes: &bytes };

1967

let entry = IndexEntry { bytes: &bytes };

1968

1969

assert_eq!(entry.uncompressed_len(), 1)

1969

assert_eq!(entry.uncompressed_len(), 1)

1970

}

1970

}

1971

1972

#[test]

1972

#[test]

1973

fn test_base_revision_or_base_of_delta_chain() {

1973

fn test_base_revision_or_base_of_delta_chain() {

1974

let bytes = IndexEntryBuilder::new()

1974

let bytes = IndexEntryBuilder::new()

1975

.with_base_revision_or_base_of_delta_chain(Revision(1))

1975

.with_base_revision_or_base_of_delta_chain(Revision(1))

1976

.build();

1976

.build();

1977

let entry = IndexEntry { bytes: &bytes };

1977

let entry = IndexEntry { bytes: &bytes };

1978

1979

assert_eq!(entry.base_revision_or_base_of_delta_chain(), 1.into())

1979

assert_eq!(entry.base_revision_or_base_of_delta_chain(), 1.into())

1980

}

1980

}

1981

1982

#[test]

1982

#[test]

1983

fn link_revision_test() {

1983

fn link_revision_test() {

1984

let bytes = IndexEntryBuilder::new()

1984

let bytes = IndexEntryBuilder::new()

1985

.with_link_revision(Revision(123))

1985

.with_link_revision(Revision(123))

1986

.build();

1986

.build();

1987

1988

let entry = IndexEntry { bytes: &bytes };

1988

let entry = IndexEntry { bytes: &bytes };

1989

1990

assert_eq!(entry.link_revision(), 123.into());

1990

assert_eq!(entry.link_revision(), 123.into());

1991

}

1991

}

1992

1993

#[test]

1993

#[test]

1994

fn p1_test() {

1994

fn p1_test() {

1995

let bytes = IndexEntryBuilder::new().with_p1(Revision(123)).build();

1995

let bytes = IndexEntryBuilder::new().with_p1(Revision(123)).build();

1996

1997

let entry = IndexEntry { bytes: &bytes };

1997

let entry = IndexEntry { bytes: &bytes };

1998

1999

assert_eq!(entry.p1(), 123.into());

1999

assert_eq!(entry.p1(), 123.into());

2000

}

2000

}

2001

2002

#[test]

2002

#[test]

2003

fn p2_test() {

2003

fn p2_test() {

2004

let bytes = IndexEntryBuilder::new().with_p2(Revision(123)).build();

2004

let bytes = IndexEntryBuilder::new().with_p2(Revision(123)).build();

2005

2006

let entry = IndexEntry { bytes: &bytes };

2006

let entry = IndexEntry { bytes: &bytes };

2007

2008

assert_eq!(entry.p2(), 123.into());

2008

assert_eq!(entry.p2(), 123.into());

2009

}

2009

}

2010

2011

#[test]

2011

#[test]

2012

fn node_test() {

2012

fn node_test() {

2013

let node = Node::from_hex("0123456789012345678901234567890123456789")

2013

let node = Node::from_hex("0123456789012345678901234567890123456789")

2014

.unwrap();

2014

.unwrap();

2015

let bytes = IndexEntryBuilder::new().with_node(node).build();

2015

let bytes = IndexEntryBuilder::new().with_node(node).build();

2016

2017

let entry = IndexEntry { bytes: &bytes };

2017

let entry = IndexEntry { bytes: &bytes };

2018

2019

assert_eq!(*entry.hash(), node);

2019

assert_eq!(*entry.hash(), node);

2020

}

2020

}

2021

2022

#[test]

2022

#[test]

2023

fn version_test() {

2023

fn version_test() {

2024

let bytes = IndexEntryBuilder::new()

2024

let bytes = IndexEntryBuilder::new()

2025

.is_first(true)

2025

.is_first(true)

2026

.with_version(2)

2026

.with_version(2)

2027

.build();

2027

.build();

2028

2029

assert_eq!(get_version(&bytes), 2)

2029

assert_eq!(get_version(&bytes), 2)

2030

}

2030

}

2031

}

2031

}

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             use std::collections::{HashMap, HashSet};
             use std::fmt::Debug;
             use std::ops::Deref;
             use std::sync::{RwLock, RwLockReadGuard, RwLockWriteGuard};
             use bitvec::prelude::*;
             use byteorder::{BigEndian, ByteOrder};
             use bytes_cast::{unaligned, BytesCast};
             use super::REVIDX_KNOWN_FLAGS;
             use crate::errors::HgError;
             use crate::node::{NODE_BYTES_LENGTH, NULL_NODE, STORED_NODE_ID_BYTES};
             use crate::revlog::node::Node;
             use crate::revlog::{Revision, NULL_REVISION};
             use crate::{
                 dagops, BaseRevision, FastHashMap, Graph, GraphError, RevlogError,
                 RevlogIndex, UncheckedRevision,
             };
             pub const INDEX_ENTRY_SIZE: usize = 64;
             pub const INDEX_HEADER_SIZE: usize = 4;
             pub const COMPRESSION_MODE_INLINE: u8 = 2;
             #[derive(Debug)]
             pub struct IndexHeader {
                 pub(super) header_bytes: [u8; INDEX_HEADER_SIZE],
             }
-            #[derive(Copy, Clone)]
+            #[derive(Copy, Clone, Debug)]
             pub struct IndexHeaderFlags {
                 flags: u16,
             }
             /// Corresponds to the high bits of `_format_flags` in python
             impl IndexHeaderFlags {
                 /// Corresponds to FLAG_INLINE_DATA in python
                 pub fn is_inline(self) -> bool {
                     self.flags & 1 != 0
                 }
                 /// Corresponds to FLAG_GENERALDELTA in python
                 pub fn uses_generaldelta(self) -> bool {
                     self.flags & 2 != 0
                 }
             }
             /// Corresponds to the INDEX_HEADER structure,
             /// which is parsed as a `header` variable in `_loadindex` in `revlog.py`
             impl IndexHeader {
                 fn format_flags(&self) -> IndexHeaderFlags {
                     // No "unknown flags" check here, unlike in python. Maybe there should
                     // be.
                     IndexHeaderFlags {
                         flags: BigEndian::read_u16(&self.header_bytes[0..2]),
                     }
                 }
                 /// The only revlog version currently supported by rhg.
                 const REVLOGV1: u16 = 1;
                 /// Corresponds to `_format_version` in Python.
                 fn format_version(&self) -> u16 {
                     BigEndian::read_u16(&self.header_bytes[2..4])
                 }
                 pub fn parse(index_bytes: &[u8]) -> Result<Option<IndexHeader>, HgError> {
                     if index_bytes.is_empty() {
                         return Ok(None);
                     }
                     if index_bytes.len() < 4 {
                         return Err(HgError::corrupted(
                             "corrupted revlog: can't read the index format header",
                         ));
                     }
                     Ok(Some(IndexHeader {
                         header_bytes: {
                             let bytes: [u8; 4] =
                                 index_bytes[0..4].try_into().expect("impossible");
                             bytes
                         },
                     }))
                 }
             }
             /// Abstracts the access to the index bytes since they can be spread between
             /// the immutable (bytes) part and the mutable (added) part if any appends
             /// happened. This makes it transparent for the callers.
             struct IndexData {
                 /// Immutable bytes, most likely taken from disk
                 bytes: Box<dyn Deref<Target = [u8]> + Send + Sync>,
                 /// Used when stripping index contents, keeps track of the start of the
                 /// first stripped revision, which is used to give a slice of the
                 /// `bytes` field.
                 truncation: Option<usize>,
                 /// Bytes that were added after reading the index
                 added: Vec<u8>,
                 first_entry: [u8; INDEX_ENTRY_SIZE],
             }
             impl IndexData {
                 pub fn new(bytes: Box<dyn Deref<Target = [u8]> + Send + Sync>) -> Self {
                     let mut first_entry = [0; INDEX_ENTRY_SIZE];
                     if bytes.len() >= INDEX_ENTRY_SIZE {
                         first_entry[INDEX_HEADER_SIZE..]
                             .copy_from_slice(&bytes[INDEX_HEADER_SIZE..INDEX_ENTRY_SIZE])
                     }
                     Self {
                         bytes,
                         truncation: None,
                         added: vec![],
                         first_entry,
                     }
                 }
                 pub fn len(&self) -> usize {
                     match self.truncation {
                         Some(truncation) => truncation + self.added.len(),
                         None => self.bytes.len() + self.added.len(),
                     }
                 }
                 fn remove(
                     &mut self,
                     rev: Revision,
                     offsets: Option<&[usize]>,
                 ) -> Result<(), RevlogError> {
                     let rev = rev.0 as usize;
                     let truncation = if let Some(offsets) = offsets {
                         offsets[rev]
                     } else {
                         rev * INDEX_ENTRY_SIZE
                     };
                     if truncation < self.bytes.len() {
                         self.truncation = Some(truncation);
                         self.added.clear();
                     } else {
                         self.added.truncate(truncation - self.bytes.len());
                     }
                     Ok(())
                 }
                 fn is_new(&self) -> bool {
                     self.bytes.is_empty()
                 }
             }
             impl std::ops::Index<std::ops::Range<usize>> for IndexData {
                 type Output = [u8];
                 fn index(&self, index: std::ops::Range<usize>) -> &Self::Output {
                     let start = index.start;
                     let end = index.end;
                     let immutable_len = match self.truncation {
                         Some(truncation) => truncation,
                         None => self.bytes.len(),
                     };
                     if start < immutable_len {
                         if end > immutable_len {
                             panic!("index data cannot span existing and added ranges");
                         }
                         &self.bytes[index]
                     } else {
                         &self.added[start - immutable_len..end - immutable_len]
                     }
                 }
             }
             #[derive(Debug, PartialEq, Eq)]
             pub struct RevisionDataParams {
                 pub flags: u16,
                 pub data_offset: u64,
                 pub data_compressed_length: i32,
                 pub data_uncompressed_length: i32,
                 pub data_delta_base: i32,
                 pub link_rev: i32,
                 pub parent_rev_1: i32,
                 pub parent_rev_2: i32,
                 pub node_id: [u8; NODE_BYTES_LENGTH],
                 pub _sidedata_offset: u64,
                 pub _sidedata_compressed_length: i32,
                 pub data_compression_mode: u8,
                 pub _sidedata_compression_mode: u8,
                 pub _rank: i32,
             }
             impl Default for RevisionDataParams {
                 fn default() -> Self {
                     Self {
                         flags: 0,
                         data_offset: 0,
                         data_compressed_length: 0,
                         data_uncompressed_length: 0,
                         data_delta_base: -1,
                         link_rev: -1,
                         parent_rev_1: -1,
                         parent_rev_2: -1,
                         node_id: [0; NODE_BYTES_LENGTH],
                         _sidedata_offset: 0,
                         _sidedata_compressed_length: 0,
                         data_compression_mode: COMPRESSION_MODE_INLINE,
                         _sidedata_compression_mode: COMPRESSION_MODE_INLINE,
                         _rank: -1,
                     }
                 }
             }
             #[derive(BytesCast)]
             #[repr(C)]
             pub struct RevisionDataV1 {
                 data_offset_or_flags: unaligned::U64Be,
                 data_compressed_length: unaligned::I32Be,
                 data_uncompressed_length: unaligned::I32Be,
                 data_delta_base: unaligned::I32Be,
                 link_rev: unaligned::I32Be,
                 parent_rev_1: unaligned::I32Be,
                 parent_rev_2: unaligned::I32Be,
                 node_id: [u8; STORED_NODE_ID_BYTES],
             }
             fn _static_assert_size_of_revision_data_v1() {
                 let _ = std::mem::transmute::<RevisionDataV1, [u8; 64]>;
             }
             impl RevisionDataParams {
                 pub fn validate(&self) -> Result<(), RevlogError> {
                     if self.flags & !REVIDX_KNOWN_FLAGS != 0 {
                         return Err(RevlogError::corrupted(format!(
                             "unknown revlog index flags: {}",
                             self.flags
                         )));
                     }
                     if self.data_compression_mode != COMPRESSION_MODE_INLINE {
                         return Err(RevlogError::corrupted(format!(
                             "invalid data compression mode: {}",
                             self.data_compression_mode
                         )));
                     }
                     // FIXME isn't this only for v2 or changelog v2?
                     if self._sidedata_compression_mode != COMPRESSION_MODE_INLINE {
                         return Err(RevlogError::corrupted(format!(
                             "invalid sidedata compression mode: {}",
                             self._sidedata_compression_mode
                         )));
                     }
                     Ok(())
                 }
                 pub fn into_v1(self) -> RevisionDataV1 {
                     let data_offset_or_flags = self.data_offset << 16 | self.flags as u64;
                     let mut node_id = [0; STORED_NODE_ID_BYTES];
                     node_id[..NODE_BYTES_LENGTH].copy_from_slice(&self.node_id);
                     RevisionDataV1 {
                         data_offset_or_flags: data_offset_or_flags.into(),
                         data_compressed_length: self.data_compressed_length.into(),
                         data_uncompressed_length: self.data_uncompressed_length.into(),
                         data_delta_base: self.data_delta_base.into(),
                         link_rev: self.link_rev.into(),
                         parent_rev_1: self.parent_rev_1.into(),
                         parent_rev_2: self.parent_rev_2.into(),
                         node_id,
                     }
                 }
             }
             /// A Revlog index
             pub struct Index {
                 bytes: IndexData,
                 /// Offsets of starts of index blocks.
                 /// Only needed when the index is interleaved with data.
                 offsets: RwLock<Option<Vec<usize>>>,
                 uses_generaldelta: bool,
                 is_inline: bool,
                 /// Cache of (head_revisions, filtered_revisions)
                 ///
                 /// The head revisions in this index, kept in sync. Should
                 /// be accessed via the [`Self::head_revs`] method.
                 /// The last filtered revisions in this index, used to make sure
                 /// we haven't changed filters when returning the cached `head_revs`.
                 head_revs: RwLock<(Vec<Revision>, HashSet<Revision>)>,
             }
             impl Debug for Index {
                 fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
                     f.debug_struct("Index")
                         .field("offsets", &self.offsets)
                         .field("uses_generaldelta", &self.uses_generaldelta)
                         .finish()
                 }
             }
             impl Graph for Index {
                 #[inline(always)]
                 fn parents(&self, rev: Revision) -> Result<[Revision; 2], GraphError> {
                     let err = || GraphError::ParentOutOfRange(rev);
                     match self.get_entry(rev) {
                         Some(entry) => {
                             // The C implementation checks that the parents are valid
                             // before returning
                             Ok([
                                 self.check_revision(entry.p1()).ok_or_else(err)?,
                                 self.check_revision(entry.p2()).ok_or_else(err)?,
                             ])
                         }
                         None => Ok([NULL_REVISION, NULL_REVISION]),
                     }
                 }
             }
             /// A cache suitable for find_snapshots
             ///
             /// Logically equivalent to a mapping whose keys are [`BaseRevision`] and
             /// values sets of [`BaseRevision`]
             ///
             /// TODO the dubious part is insisting that errors must be RevlogError
             /// we would probably need to sprinkle some magic here, such as an associated
             /// type that would be Into<RevlogError> but even that would not be
             /// satisfactory, as errors potentially have nothing to do with the revlog.
             pub trait SnapshotsCache {
                 fn insert_for(
                     &mut self,
                     rev: BaseRevision,
                     value: BaseRevision,
                 ) -> Result<(), RevlogError>;
             }
             impl SnapshotsCache for FastHashMap<BaseRevision, HashSet<BaseRevision>> {
                 fn insert_for(
                     &mut self,
                     rev: BaseRevision,
                     value: BaseRevision,
                 ) -> Result<(), RevlogError> {
                     let all_values = self.entry(rev).or_default();
                     all_values.insert(value);
                     Ok(())
                 }
             }
             impl Index {
                 /// Create an index from bytes.
                 /// Calculate the start of each entry when is_inline is true.
                 pub fn new(
                     bytes: Box<dyn Deref<Target = [u8]> + Send + Sync>,
                     default_header: IndexHeader,
                 ) -> Result<Self, HgError> {
                     let header =
                         IndexHeader::parse(bytes.as_ref())?.unwrap_or(default_header);
                     if header.format_version() != IndexHeader::REVLOGV1 {
                         // A proper new version should have had a repo/store
                         // requirement.
                         return Err(HgError::corrupted("unsupported revlog version"));
                     }
                     let uses_generaldelta = header.format_flags().uses_generaldelta();
                     if header.format_flags().is_inline() {
                         let mut offset: usize = 0;
                         let mut offsets = Vec::new();
                         while offset + INDEX_ENTRY_SIZE <= bytes.len() {
                             offsets.push(offset);
                             let end = offset + INDEX_ENTRY_SIZE;
                             let entry = IndexEntry {
                                 bytes: &bytes[offset..end],
                             };
                             offset += INDEX_ENTRY_SIZE + entry.compressed_len() as usize;
                         }
                         if offset == bytes.len() {
                             Ok(Self {
                                 bytes: IndexData::new(bytes),
                                 offsets: RwLock::new(Some(offsets)),
                                 uses_generaldelta,
                                 is_inline: true,
                                 head_revs: RwLock::new((vec![], HashSet::new())),
                             })
                         } else {
                             Err(HgError::corrupted("unexpected inline revlog length"))
                         }
                     } else {
                         Ok(Self {
                             bytes: IndexData::new(bytes),
                             offsets: RwLock::new(None),
                             uses_generaldelta,
                             is_inline: false,
                             head_revs: RwLock::new((vec![], HashSet::new())),
                         })
                     }
                 }
                 pub fn uses_generaldelta(&self) -> bool {
                     self.uses_generaldelta
                 }
                 /// Value of the inline flag.
                 pub fn is_inline(&self) -> bool {
                     self.is_inline
                 }
                 /// Return a slice of bytes if `revlog` is inline. Panic if not.
                 pub fn data(&self, start: usize, end: usize) -> &[u8] {
                     if !self.is_inline() {
                         panic!("tried to access data in the index of a revlog that is not inline");
                     }
                     &self.bytes[start..end]
                 }
                 /// Return number of entries of the revlog index.
                 pub fn len(&self) -> usize {
                     if self.is_inline() {
                         (*self.get_offsets())
                             .as_ref()
                             .expect("inline should have offsets")
                             .len()
                     } else {
                         self.bytes.len() / INDEX_ENTRY_SIZE
                     }
                 }
                 pub fn get_offsets(&self) -> RwLockReadGuard<Option<Vec<usize>>> {
                     assert!(self.is_inline());
                     {
                         // Wrap in a block to drop the read guard
                         let mut offsets = self.offsets.write().unwrap();
                         if offsets.is_none() {
                             offsets.replace(inline_scan(&self.bytes.bytes).1);
                         }
                     }
                     self.offsets.read().unwrap()
                 }
                 pub fn get_offsets_mut(&mut self) -> RwLockWriteGuard<Option<Vec<usize>>> {
                     assert!(self.is_inline());
                     let mut offsets = self.offsets.write().unwrap();
                     if offsets.is_none() {
                         offsets.replace(inline_scan(&self.bytes.bytes).1);
                     }
                     offsets
                 }
                 /// Returns `true` if the `Index` has zero `entries`.
                 pub fn is_empty(&self) -> bool {
                     self.len() == 0
                 }
                 /// Return the index entry corresponding to the given revision or `None`
                 /// for [`NULL_REVISION`]
                 ///
                 /// The specified revision being of the checked type, it always exists
                 /// if it was validated by this index.
                 pub fn get_entry(&self, rev: Revision) -> Option<IndexEntry> {
                     if rev == NULL_REVISION {
                         return None;
                     }
                     if rev.0 == 0 {
                         Some(IndexEntry {
                             bytes: &self.bytes.first_entry[..],
                         })
                     } else {
                         Some(if self.is_inline() {
                             self.get_entry_inline(rev)
                         } else {
                             self.get_entry_separated(rev)
                         })
                     }
                 }
                 /// Return the binary content of the index entry for the given revision
                 ///
                 /// See [get_entry()](`Self::get_entry()`) for cases when `None` is
                 /// returned.
                 pub fn entry_binary(&self, rev: Revision) -> Option<&[u8]> {
                     self.get_entry(rev).map(|e| {
                         let bytes = e.as_bytes();
                         if rev.0 == 0 {
                             &bytes[4..]
                         } else {
                             bytes
                         }
                     })
                 }
                 pub fn entry_as_params(
                     &self,
                     rev: UncheckedRevision,
                 ) -> Option<RevisionDataParams> {
                     let rev = self.check_revision(rev)?;
                     self.get_entry(rev).map(|e| RevisionDataParams {
                         flags: e.flags(),
                         data_offset: if rev.0 == 0 && !self.bytes.is_new() {
                             e.flags() as u64
                         } else {
                             e.raw_offset()
                         },
                         data_compressed_length: e
                             .compressed_len()
                             .try_into()
                             .unwrap_or_else(|_| {
                                 // Python's `unionrepo` sets the compressed length to be
                                 // `-1` (or `u32::MAX` if transmuted to `u32`) because it
                                 // cannot know the correct compressed length of a given
                                 // revision. I'm not sure if this is true, but having this
                                 // edge case won't hurt other use cases, let's handle it.
                                 assert_eq!(e.compressed_len(), u32::MAX);
                                 NULL_REVISION.0
                             }),
                         data_uncompressed_length: e.uncompressed_len(),
                         data_delta_base: e.base_revision_or_base_of_delta_chain().0,
                         link_rev: e.link_revision().0,
                         parent_rev_1: e.p1().0,
                         parent_rev_2: e.p2().0,
                         node_id: e.hash().as_bytes().try_into().unwrap(),
                         ..Default::default()
                     })
                 }
                 fn get_entry_inline(&self, rev: Revision) -> IndexEntry {
                     let offsets = &self.get_offsets();
                     let offsets = offsets.as_ref().expect("inline should have offsets");
                     let start = offsets[rev.0 as usize];
                     let end = start + INDEX_ENTRY_SIZE;
                     let bytes = &self.bytes[start..end];
                     IndexEntry { bytes }
                 }
                 fn get_entry_separated(&self, rev: Revision) -> IndexEntry {
                     let start = rev.0 as usize * INDEX_ENTRY_SIZE;
                     let end = start + INDEX_ENTRY_SIZE;
                     let bytes = &self.bytes[start..end];
                     IndexEntry { bytes }
                 }
                 fn null_entry(&self) -> IndexEntry {
                     IndexEntry {
                         bytes: &[0; INDEX_ENTRY_SIZE],
                     }
                 }
                 /// Return the head revisions of this index
                 pub fn head_revs(&self) -> Result<Vec<Revision>, GraphError> {
                     self.head_revs_filtered(&HashSet::new(), false)
                         .map(|h| h.unwrap())
                 }
                 /// Python-specific shortcut to save on PyList creation
                 pub fn head_revs_shortcut(
                     &self,
                 ) -> Result<Option<Vec<Revision>>, GraphError> {
                     self.head_revs_filtered(&HashSet::new(), true)
                 }
                 /// Return the heads removed and added by advancing from `begin` to `end`.
                 /// In revset language, we compute:
                 /// - `heads(:begin)-heads(:end)`
                 /// - `heads(:end)-heads(:begin)`
                 pub fn head_revs_diff(
                     &self,
                     begin: Revision,
                     end: Revision,
                 ) -> Result<(Vec<Revision>, Vec<Revision>), GraphError> {
                     let mut heads_added = vec![];
                     let mut heads_removed = vec![];
                     let mut acc = HashSet::new();
                     let Revision(begin) = begin;
                     let Revision(end) = end;
                     let mut i = end;
                     while i > begin {
                         // acc invariant:
                         // `j` is in the set iff `j <= i` and it has children
                         // among `i+1..end` (inclusive)
                         if !acc.remove(&i) {
                             heads_added.push(Revision(i));
                         }
                         for Revision(parent) in self.parents(Revision(i))? {
                             acc.insert(parent);
                         }
                         i -= 1;
                     }
                     // At this point `acc` contains old revisions that gained new children.
                     // We need to check if they had any children before. If not, those
                     // revisions are the removed heads.
                     while !acc.is_empty() {
                         // acc invariant:
                         // `j` is in the set iff `j <= i` and it has children
                         // among `begin+1..end`, but not among `i+1..begin` (inclusive)
                         assert!(i >= -1); // yes, `-1` can also be a head if the repo is empty
                         if acc.remove(&i) {
                             heads_removed.push(Revision(i));
                         }
                         for Revision(parent) in self.parents(Revision(i))? {
                             acc.remove(&parent);
                         }
                         i -= 1;
                     }
                     Ok((heads_removed, heads_added))
                 }
                 /// Return the head revisions of this index
                 pub fn head_revs_filtered(
                     &self,
                     filtered_revs: &HashSet<Revision>,
                     py_shortcut: bool,
                 ) -> Result<Option<Vec<Revision>>, GraphError> {
                     {
                         let guard = self
                             .head_revs
                             .read()
                             .expect("RwLock on Index.head_revs should not be poisoned");
                         let self_head_revs = &guard.0;
                         let self_filtered_revs = &guard.1;
                         if !self_head_revs.is_empty()
                             && filtered_revs == self_filtered_revs
                         {
                             if py_shortcut {
                                 // Don't copy the revs since we've already cached them
                                 // on the Python side.
                                 return Ok(None);
                             } else {
                                 return Ok(Some(self_head_revs.to_owned()));
                             }
                         }
                     }
                     let as_vec = if self.is_empty() {
                         vec![NULL_REVISION]
                     } else {
                         let mut not_heads = bitvec![0; self.len()];
                         dagops::retain_heads_fast(
                             self,
                             not_heads.as_mut_bitslice(),
                             filtered_revs,
                         )?;
                         not_heads
                             .into_iter()
                             .enumerate()
                             .filter_map(|(idx, is_not_head)| {
                                 if is_not_head {
                                     None
                                 } else {
                                     Some(Revision(idx as BaseRevision))
                                 }
                             })
                             .collect()
                     };
                     *self
                         .head_revs
                         .write()
                         .expect("RwLock on Index.head_revs should not be poisoned") =
                         (as_vec.to_owned(), filtered_revs.to_owned());
                     Ok(Some(as_vec))
                 }
                 /// Obtain the delta chain for a revision.
                 ///
                 /// `stop_rev` specifies a revision to stop at. If not specified, we
                 /// stop at the base of the chain.
                 ///
                 /// Returns a 2-tuple of (chain, stopped) where `chain` is a vec of
                 /// revs in ascending order and `stopped` is a bool indicating whether
                 /// `stoprev` was hit.
                 pub fn delta_chain(
                     &self,
                     rev: Revision,
                     stop_rev: Option<Revision>,
                     using_general_delta: Option<bool>,
                 ) -> Result<(Vec<Revision>, bool), HgError> {
                     let mut current_rev = rev;
                     let mut entry = self.get_entry(rev).unwrap();
                     let mut chain = vec![];
                     let using_general_delta =
                         using_general_delta.unwrap_or_else(|| self.uses_generaldelta());
                     while current_rev.0 != entry.base_revision_or_base_of_delta_chain().0
                         && stop_rev.map(|r| r != current_rev).unwrap_or(true)
                     {
                         chain.push(current_rev);
                         let new_rev = if using_general_delta {
                             entry.base_revision_or_base_of_delta_chain()
                         } else {
                             UncheckedRevision(current_rev.0 - 1)
                         };
                         current_rev = self.check_revision(new_rev).ok_or_else(|| {
                             HgError::corrupted(format!("Revision {new_rev} out of range"))
                         })?;
                         if current_rev.0 == NULL_REVISION.0 {
                             break;
                         }
                         entry = self.get_entry(current_rev).unwrap()
                     }
                     let stopped = if stop_rev.map(|r| current_rev == r).unwrap_or(false) {
                         true
                     } else {
                         chain.push(current_rev);
                         false
                     };
                     chain.reverse();
                     Ok((chain, stopped))
                 }
                 pub fn find_snapshots(
                     &self,
                     start_rev: UncheckedRevision,
                     end_rev: UncheckedRevision,
                     cache: &mut impl SnapshotsCache,
                 ) -> Result<(), RevlogError> {
                     let mut start_rev = start_rev.0;
                     let mut end_rev = end_rev.0;
                     end_rev += 1;
                     let len = self.len().try_into().unwrap();
                     if end_rev > len {
                         end_rev = len;
                     }
                     if start_rev < 0 {
                         start_rev = 0;
                     }
                     for rev in start_rev..end_rev {
                         if !self.is_snapshot_unchecked(Revision(rev))? {
                             continue;
                         }
                         let mut base = self
                             .get_entry(Revision(rev))
                             .unwrap()
                             .base_revision_or_base_of_delta_chain();
                         if base.0 == rev {
                             base = NULL_REVISION.into();
                         }
                         cache.insert_for(base.0, rev)?;
                     }
                     Ok(())
                 }
                 fn clear_head_revs(&self) {
                     self.head_revs
                         .write()
                         .expect("RwLock on Index.head_revs should not be poisoined")
                         .0
                         .clear()
                 }
                 /// TODO move this to the trait probably, along with other things
                 pub fn append(
                     &mut self,
                     revision_data: RevisionDataParams,
                 ) -> Result<(), RevlogError> {
                     revision_data.validate()?;
                     let entry_v1 = revision_data.into_v1();
                     let entry_bytes = entry_v1.as_bytes();
                     if self.bytes.len() == 0 {
                         self.bytes.first_entry[INDEX_HEADER_SIZE..].copy_from_slice(
                             &entry_bytes[INDEX_HEADER_SIZE..INDEX_ENTRY_SIZE],
                         )
                     }
                     if self.is_inline() {
                         let new_offset = self.bytes.len();
                         if let Some(offsets) = &mut *self.get_offsets_mut() {
                             offsets.push(new_offset)
                         }
                     }
                     self.bytes.added.extend(entry_bytes);
                     self.clear_head_revs();
                     Ok(())
                 }
                 pub fn pack_header(&self, header: i32) -> [u8; 4] {
                     header.to_be_bytes()
                 }
                 pub fn remove(&mut self, rev: Revision) -> Result<(), RevlogError> {
                     let offsets = if self.is_inline() {
                         self.get_offsets().clone()
                     } else {
                         None
                     };
                     self.bytes.remove(rev, offsets.as_deref())?;
                     if self.is_inline() {
                         if let Some(offsets) = &mut *self.get_offsets_mut() {
                             offsets.truncate(rev.0 as usize)
                         }
                     }
                     self.clear_head_revs();
                     Ok(())
                 }
                 pub fn clear_caches(&self) {
                     // We need to get the 'inline' value from Python at init and use this
                     // instead of offsets to determine whether we're inline since we might
                     // clear caches. This implies re-populating the offsets on-demand.
                     *self
                         .offsets
                         .write()
                         .expect("RwLock on Index.offsets should not be poisoed") = None;
                     self.clear_head_revs();
                 }
                 /// Unchecked version of `is_snapshot`.
                 /// Assumes the caller checked that `rev` is within a valid revision range.
                 pub fn is_snapshot_unchecked(
                     &self,
                     mut rev: Revision,
                 ) -> Result<bool, RevlogError> {
                     while rev.0 >= 0 {
                         let entry = self.get_entry(rev).unwrap();
                         let mut base = entry.base_revision_or_base_of_delta_chain().0;
                         if base == rev.0 {
                             base = NULL_REVISION.0;
                         }
                         if base == NULL_REVISION.0 {
                             return Ok(true);
                         }
                         let [mut p1, mut p2] = self
                             .parents(rev)
                             .map_err(|_| RevlogError::InvalidRevision)?;
                         while let Some(p1_entry) = self.get_entry(p1) {
                             if p1_entry.compressed_len() != 0 || p1.0 == 0 {
                                 break;
                             }
                             let parent_base =
                                 p1_entry.base_revision_or_base_of_delta_chain();
                             if parent_base.0 == p1.0 {
                                 break;
                             }
                             p1 = self
                                 .check_revision(parent_base)
                                 .ok_or(RevlogError::InvalidRevision)?;
                         }
                         while let Some(p2_entry) = self.get_entry(p2) {
                             if p2_entry.compressed_len() != 0 || p2.0 == 0 {
                                 break;
                             }
                             let parent_base =
                                 p2_entry.base_revision_or_base_of_delta_chain();
                             if parent_base.0 == p2.0 {
                                 break;
                             }
                             p2 = self
                                 .check_revision(parent_base)
                                 .ok_or(RevlogError::InvalidRevision)?;
                         }
                         if base == p1.0 || base == p2.0 {
                             return Ok(false);
                         }
                         rev = self
                             .check_revision(base.into())
                             .ok_or(RevlogError::InvalidRevision)?;
                     }
                     Ok(rev == NULL_REVISION)
                 }
                 /// Return whether the given revision is a snapshot. Returns an error if
                 /// `rev` is not within a valid revision range.
                 pub fn is_snapshot(
                     &self,
                     rev: UncheckedRevision,
                 ) -> Result<bool, RevlogError> {
                     let rev = self
                         .check_revision(rev)
                         .ok_or_else(|| RevlogError::corrupted("test"))?;
                     self.is_snapshot_unchecked(rev)
                 }
                 /// Slice revs to reduce the amount of unrelated data to be read from disk.
                 ///
                 /// The index is sliced into groups that should be read in one time.
                 ///
                 /// The initial chunk is sliced until the overall density
                 /// (payload/chunks-span ratio) is above `target_density`.
                 /// No gap smaller than `min_gap_size` is skipped.
                 pub fn slice_chunk_to_density(
                     &self,
                     revs: &[Revision],
                     target_density: f64,
                     min_gap_size: usize,
                 ) -> Vec<Vec<Revision>> {
                     if revs.is_empty() {
                         return vec![];
                     }
                     if revs.len() == 1 {
                         return vec![revs.to_owned()];
                     }
                     let delta_chain_span = self.segment_span(revs);
                     if delta_chain_span < min_gap_size {
                         return vec![revs.to_owned()];
                     }
                     let entries: Vec<_> = revs
                         .iter()
                         .map(|r| {
                             (*r, self.get_entry(*r).unwrap_or_else(|| self.null_entry()))
                         })
                         .collect();
                     let mut read_data = delta_chain_span;
                     let chain_payload: u32 =
                         entries.iter().map(|(_r, e)| e.compressed_len()).sum();
                     let mut density = if delta_chain_span > 0 {
                         chain_payload as f64 / delta_chain_span as f64
                     } else {
 .0
                     };
                     if density >= target_density {
                         return vec![revs.to_owned()];
                     }
                     // Store the gaps in a heap to have them sorted by decreasing size
                     let mut gaps = Vec::new();
                     let mut previous_end = None;
                     for (i, (_rev, entry)) in entries.iter().enumerate() {
                         let start = entry.c_start() as usize;
                         let length = entry.compressed_len();
                         // Skip empty revisions to form larger holes
                         if length == 0 {
                             continue;
                         }
                         if let Some(end) = previous_end {
                             let gap_size = start - end;
                             // Only consider holes that are large enough
                             if gap_size > min_gap_size {
                                 gaps.push((gap_size, i));
                             }
                         }
                         previous_end = Some(start + length as usize);
                     }
                     if gaps.is_empty() {
                         return vec![revs.to_owned()];
                     }
                     // sort the gaps to pop them from largest to small
                     gaps.sort_unstable();
                     // Collect the indices of the largest holes until
                     // the density is acceptable
                     let mut selected = vec![];
                     while let Some((gap_size, gap_id)) = gaps.pop() {
                         if density >= target_density {
                             break;
                         }
                         selected.push(gap_id);
                         // The gap sizes are stored as negatives to be sorted decreasingly
                         // by the heap
                         read_data -= gap_size;
                         density = if read_data > 0 {
                             chain_payload as f64 / read_data as f64
                         } else {
 .0
                         };
                         if density >= target_density {
                             break;
                         }
                     }
                     selected.sort_unstable();
                     selected.push(revs.len());
                     // Cut the revs at collected indices
                     let mut previous_idx = 0;
                     let mut chunks = vec![];
                     for idx in selected {
                         let chunk = self.trim_chunk(&entries, previous_idx, idx);
                         if !chunk.is_empty() {
                             chunks.push(chunk.iter().map(|(rev, _entry)| *rev).collect());
                         }
                         previous_idx = idx;
                     }
                     let chunk = self.trim_chunk(&entries, previous_idx, entries.len());
                     if !chunk.is_empty() {
                         chunks.push(chunk.iter().map(|(rev, _entry)| *rev).collect());
                     }
                     chunks
                 }
                 /// Get the byte span of a segment of sorted revisions.
                 ///
                 /// Occurrences of [`NULL_REVISION`] are ignored at the beginning of
                 /// the `revs` segment.
                 ///
                 /// panics:
                 ///  - if `revs` is empty or only made of `NULL_REVISION`
                 ///  - if cannot retrieve entry for the last or first not null element of
                 ///    `revs`.
                 fn segment_span(&self, revs: &[Revision]) -> usize {
                     if revs.is_empty() {
                         return 0;
                     }
                     let last_entry = &self.get_entry(revs[revs.len() - 1]).unwrap();
                     let end = last_entry.c_start() + last_entry.compressed_len() as u64;
                     let first_rev = revs.iter().find(|r| r.0 != NULL_REVISION.0).unwrap();
                     let start = if first_rev.0 == 0 {
                     } else {
                         self.get_entry(*first_rev).unwrap().c_start()
                     };
                     (end - start) as usize
                 }
                 /// Returns `&revs[startidx..endidx]` without empty trailing revs
                 fn trim_chunk<'a>(
                     &'a self,
                     revs: &'a [(Revision, IndexEntry)],
                     start: usize,
                     mut end: usize,
                 ) -> &'a [(Revision, IndexEntry)] {
                     // Trim empty revs at the end, except the very first rev of a chain
                     let last_rev = revs[end - 1].0;
                     if last_rev.0 < self.len() as BaseRevision {
                         while end > 1
                             && end > start
                             && revs[end - 1].1.compressed_len() == 0
                         {
                             end -= 1
                         }
                     }
                     &revs[start..end]
                 }
                 /// Computes the set of revisions for each non-public phase from `roots`,
                 /// which are the last known roots for each non-public phase.
                 pub fn compute_phases_map_sets(
                     &self,
                     roots: HashMap<Phase, Vec<Revision>>,
                 ) -> Result<(usize, RootsPerPhase), GraphError> {
                     let mut phases = vec![Phase::Public; self.len()];
                     let mut min_phase_rev = NULL_REVISION;
                     for phase in Phase::non_public_phases() {
                         if let Some(phase_roots) = roots.get(phase) {
                             let min_rev =
                                 self.add_roots_get_min(phase_roots, &mut phases, *phase);
                             if min_rev != NULL_REVISION
                                 && (min_phase_rev == NULL_REVISION
                                     || min_rev < min_phase_rev)
                             {
                                 min_phase_rev = min_rev;
                             }
                         } else {
                             continue;
                         };
                     }
                     let mut phase_sets: RootsPerPhase = Default::default();
                     if min_phase_rev == NULL_REVISION {
                         min_phase_rev = Revision(self.len() as BaseRevision);
                     }
                     for rev in min_phase_rev.0..self.len() as BaseRevision {
                         let rev = Revision(rev);
                         let [p1, p2] = self.parents(rev)?;
                         if p1.0 >= 0 && phases[p1.0 as usize] > phases[rev.0 as usize] {
                             phases[rev.0 as usize] = phases[p1.0 as usize];
                         }
                         if p2.0 >= 0 && phases[p2.0 as usize] > phases[rev.0 as usize] {
                             phases[rev.0 as usize] = phases[p2.0 as usize];
                         }
                         let set = match phases[rev.0 as usize] {
                             Phase::Public => continue,
                             phase => &mut phase_sets[phase as usize - 1],
                         };
                         set.push(rev);
                     }
                     Ok((self.len(), phase_sets))
                 }
                 fn add_roots_get_min(
                     &self,
                     phase_roots: &[Revision],
                     phases: &mut [Phase],
                     phase: Phase,
                 ) -> Revision {
                     let mut min_rev = NULL_REVISION;
                     for root in phase_roots {
                         phases[root.0 as usize] = phase;
                         if min_rev == NULL_REVISION || min_rev > *root {
                             min_rev = *root;
                         }
                     }
                     min_rev
                 }
                 /// Return `(heads(::(<roots> and <roots>::<heads>)))`
                 /// If `include_path` is `true`, return `(<roots>::<heads>)`."""
                 ///
                 /// `min_root` and `roots` are unchecked since they are just used as
                 /// a bound or for comparison and don't need to represent a valid revision.
                 /// In practice, the only invalid revision passed is the working directory
                 /// revision ([`i32::MAX`]).
                 pub fn reachable_roots(
                     &self,
                     min_root: UncheckedRevision,
                     mut heads: Vec<Revision>,
                     roots: HashSet<UncheckedRevision>,
                     include_path: bool,
                 ) -> Result<HashSet<Revision>, GraphError> {
                     if roots.is_empty() {
                         return Ok(HashSet::new());
                     }
                     let mut reachable = HashSet::new();
                     let mut seen = HashMap::new();
                     while let Some(rev) = heads.pop() {
                         if roots.contains(&rev.into()) {
                             reachable.insert(rev);
                             if !include_path {
                                 continue;
                             }
                         }
                         let parents = self.parents(rev)?;
                         seen.insert(rev, parents);
                         for parent in parents {
                             if parent.0 >= min_root.0 && !seen.contains_key(&parent) {
                                 heads.push(parent);
                             }
                         }
                     }
                     if !include_path {
                         return Ok(reachable);
                     }
                     let mut revs: Vec<_> = seen.keys().collect();
                     revs.sort_unstable();
                     for rev in revs {
                         for parent in seen[rev] {
                             if reachable.contains(&parent) {
                                 reachable.insert(*rev);
                             }
                         }
                     }
                     Ok(reachable)
                 }
                 /// Given a (possibly overlapping) set of revs, return all the
                 /// common ancestors heads: `heads(::args[0] and ::a[1] and ...)`
                 pub fn common_ancestor_heads(
                     &self,
                     revisions: &[Revision],
                 ) -> Result<Vec<Revision>, GraphError> {
                     // given that revisions is expected to be small, we find this shortcut
                     // potentially acceptable, especially given that `hg-cpython` could
                     // very much bypass this, constructing a vector of unique values from
                     // the onset.
                     let as_set: HashSet<Revision> = revisions.iter().copied().collect();
                     // Besides deduplicating, the C version also implements the shortcut
                     // for `NULL_REVISION`:
                     if as_set.contains(&NULL_REVISION) {
                         return Ok(vec![]);
                     }
                     let revisions: Vec<Revision> = as_set.into_iter().collect();
                     if revisions.len() < 8 {
                         self.find_gca_candidates::<u8>(&revisions)
                     } else if revisions.len() < 64 {
                         self.find_gca_candidates::<u64>(&revisions)
                     } else {
                         self.find_gca_candidates::<NonStaticPoisonableBitSet>(&revisions)
                     }
                 }
                 pub fn ancestors(
                     &self,
                     revisions: &[Revision],
                 ) -> Result<Vec<Revision>, GraphError> {
                     self.find_deepest_revs(&self.common_ancestor_heads(revisions)?)
                 }
                 /// Given a disjoint set of revs, return all candidates for the
                 /// greatest common ancestor. In revset notation, this is the set
                 /// `heads(::a and ::b and ...)`
                 fn find_gca_candidates<BS: PoisonableBitSet + Clone>(
                     &self,
                     revs: &[Revision],
                 ) -> Result<Vec<Revision>, GraphError> {
                     if revs.is_empty() {
                         return Ok(vec![]);
                     }
                     let revcount = revs.len();
                     let mut candidates = vec![];
                     let max_rev = revs.iter().max().unwrap();
                     let mut seen = BS::vec_of_empty(revs.len(), (max_rev.0 + 1) as usize);
                     for (idx, rev) in revs.iter().enumerate() {
                         seen[rev.0 as usize].add(idx);
                     }
                     let mut current_rev = *max_rev;
                     // Number of revisions whose inspection in the main loop
                     // will give a result or trigger inspection of other revisions
                     let mut interesting = revcount;
                     // The algorithm works on a vector of bit sets, indexed by revision
                     // numbers and iterated on reverse order.
                     // An entry in this vector is poisoned if and only if the corresponding
                     // revision is a common, yet not maximal ancestor.
                     // The principle of the algorithm is as follows:
                     // For a revision `r`, when entering the loop, `seen[r]` is either
                     // poisoned or the sub set of `revs` of which `r` is an ancestor.
                     // In this sub set is full, then `r` is a solution and its parents
                     // have to be poisoned.
                     //
                     // At each iteration, the bit sets of the parents are updated by
                     // union with `seen[r]`.
                     // As we walk the index from the end, we are sure we have encountered
                     // all children of `r` before `r`, hence we know that `seen[r]` is
                     // fully computed.
                     //
                     // On top of that there are several optimizations that make reading
                     // less obvious than the comment above:
                     // - The `interesting` counter allows to break early
                     // - The loop starts from `max(revs)`
                     // - Early return in case it is detected that one of the incoming revs
                     //   is a common ancestor of all of them.
                     while current_rev.0 >= 0 && interesting > 0 {
                         let current_seen = seen[current_rev.0 as usize].clone();
                         if current_seen.is_empty() {
                             current_rev = Revision(current_rev.0 - 1);
                             continue;
                         }
                         let mut poison = current_seen.is_poisoned();
                         if !poison {
                             interesting -= 1;
                             if current_seen.is_full_range(revcount) {
                                 candidates.push(current_rev);
                                 poison = true;
                                 // Being a common ancestor, if `current_rev` is among
                                 // the input revisions, it is *the* answer.
                                 for rev in revs {
                                     if *rev == current_rev {
                                         return Ok(candidates);
                                     }
                                 }
                             }
                         }
                         for parent in self.parents(current_rev)? {
                             if parent == NULL_REVISION {
                                 continue;
                             }
                             let parent_seen = &mut seen[parent.0 as usize];
                             if poison {
                                 // this block is logically equivalent to poisoning parent
                                 // and counting it as non interesting if it
                                 // has been seen before (hence counted then as interesting)
                                 if !parent_seen.is_empty() && !parent_seen.is_poisoned() {
                                     interesting -= 1;
                                 }
                                 parent_seen.poison();
                             } else {
                                 if parent_seen.is_empty() {
                                     interesting += 1;
                                 }
                                 parent_seen.union(&current_seen);
                             }
                         }
                         current_rev = Revision(current_rev.0 - 1);
                     }
                     Ok(candidates)
                 }
                 /// Given a disjoint set of revs, return the subset with the longest path
                 /// to the root.
                 fn find_deepest_revs(
                     &self,
                     revs: &[Revision],
                 ) -> Result<Vec<Revision>, GraphError> {
                     // TODO replace this all with just comparing rank?
                     // Also, the original implementations in C/Python are cryptic, not
                     // even sure we actually need this?
                     if revs.len() <= 1 {
                         return Ok(revs.to_owned());
                     }
                     let max_rev = revs.iter().max().unwrap().0;
                     let mut interesting = HashMap::new();
                     let mut seen = vec![0; max_rev as usize + 1];
                     let mut depth = vec![0; max_rev as usize + 1];
                     let mut mapping = vec![];
                     let mut revs = revs.to_owned();
                     revs.sort_unstable();
                     for (idx, rev) in revs.iter().enumerate() {
                         depth[rev.0 as usize] = 1;
                         let shift = 1 << idx;
                         seen[rev.0 as usize] = shift;
                         interesting.insert(shift, 1);
                         mapping.push((shift, *rev));
                     }
                     let mut current_rev = Revision(max_rev);
                     while current_rev.0 >= 0 && interesting.len() > 1 {
                         let current_depth = depth[current_rev.0 as usize];
                         if current_depth == 0 {
                             current_rev = Revision(current_rev.0 - 1);
                             continue;
                         }
                         let current_seen = seen[current_rev.0 as usize];
                         for parent in self.parents(current_rev)? {
                             if parent == NULL_REVISION {
                                 continue;
                             }
                             let parent_seen = seen[parent.0 as usize];
                             let parent_depth = depth[parent.0 as usize];
                             if parent_depth <= current_depth {
                                 depth[parent.0 as usize] = current_depth + 1;
                                 if parent_seen != current_seen {
                                     *interesting.get_mut(&current_seen).unwrap() += 1;
                                     seen[parent.0 as usize] = current_seen;
                                     if parent_seen != 0 {
                                         let parent_interesting =
                                             interesting.get_mut(&parent_seen).unwrap();
                                         *parent_interesting -= 1;
                                         if *parent_interesting == 0 {
                                             interesting.remove(&parent_seen);
                                         }
                                     }
                                 }
                             } else if current_depth == parent_depth - 1 {
                                 let either_seen = parent_seen | current_seen;
                                 if either_seen == parent_seen {
                                     continue;
                                 }
                                 seen[parent.0 as usize] = either_seen;
                                 interesting
                                     .entry(either_seen)
                                     .and_modify(|v| *v += 1)
                                     .or_insert(1);
                                 *interesting.get_mut(&parent_seen).unwrap() -= 1;
                                 if interesting[&parent_seen] == 0 {
                                     interesting.remove(&parent_seen);
                                 }
                             }
                         }
                         *interesting.get_mut(&current_seen).unwrap() -= 1;
                         if interesting[&current_seen] == 0 {
                             interesting.remove(&current_seen);
                         }
                         current_rev = Revision(current_rev.0 - 1);
                     }
                     if interesting.len() != 1 {
                         return Ok(vec![]);
                     }
                     let mask = interesting.keys().next().unwrap();
                     Ok(mapping
                         .into_iter()
                         .filter_map(|(shift, rev)| {
                             if (mask & shift) != 0 {
                                 return Some(rev);
                             }
                             None
                         })
                         .collect())
                 }
             }
             /// The kind of functionality needed by find_gca_candidates
             ///
             /// This is a bit mask which can be declared to be "poisoned", which callers
             /// interpret to break out of some loops.
             ///
             /// The maximum capacity of the bit mask is up to the actual implementation
             trait PoisonableBitSet: Sized + PartialEq {
                 /// Return a vector of exactly n elements, initialized to be empty.
                 ///
                 /// Optimization can vastly depend on implementation. Those being `Copy`
                 /// and having constant capacity typically can have a very simple
                 /// implementation.
                 fn vec_of_empty(sets_size: usize, vec_len: usize) -> Vec<Self>;
                 /// The size of the bit mask in memory
                 #[allow(unused)]
                 fn size(&self) -> usize;
                 /// The number of elements that can be represented in the set.
                 ///
                 /// Another way to put it is that it is the highest integer `C` such that
                 /// the set is guaranteed to always be a subset of the integer range
                 /// `[0, C)`
                 #[allow(unused)]
                 fn capacity(&self) -> usize;
                 /// Declare `n` to belong to the set
                 fn add(&mut self, n: usize);
                 /// Declare `n` not to belong to the set
                 #[allow(unused)]
                 fn discard(&mut self, n: usize);
                 /// Replace this bit set by its union with other
                 fn union(&mut self, other: &Self);
                 /// Poison the bit set
                 ///
                 /// Interpretation up to the caller
                 fn poison(&mut self);
                 /// Is the bit set poisoned?
                 ///
                 /// Interpretation is up to the caller
                 fn is_poisoned(&self) -> bool;
                 /// Is the bit set empty?
                 fn is_empty(&self) -> bool;
                 /// return `true` if and only if the bit is the full range `[0, n)`
                 /// of integers
                 fn is_full_range(&self, n: usize) -> bool;
             }
             const U64_POISON: u64 = 1 << 63;
             const U8_POISON: u8 = 1 << 7;
             impl PoisonableBitSet for u64 {
                 fn vec_of_empty(_sets_size: usize, vec_len: usize) -> Vec<Self> {
                     vec![0u64; vec_len]
                 }
                 fn size(&self) -> usize {
                 }
                 fn capacity(&self) -> usize {
                 }
                 fn add(&mut self, n: usize) {
                     (*self) |= 1u64 << n;
                 }
                 fn discard(&mut self, n: usize) {
                     (*self) &= u64::MAX - (1u64 << n);
                 }
                 fn union(&mut self, other: &Self) {
                     if *self != *other {
                         (*self) |= *other;
                     }
                 }
                 fn is_full_range(&self, n: usize) -> bool {
                     *self + 1 == (1u64 << n)
                 }
                 fn is_empty(&self) -> bool {
                     *self == 0
                 }
                 fn poison(&mut self) {
                     *self = U64_POISON;
                 }
                 fn is_poisoned(&self) -> bool {
                     // equality comparison would be tempting but would not resist
                     // operations after poisoning (even if these should be bogus).
                     *self >= U64_POISON
                 }
             }
             impl PoisonableBitSet for u8 {
                 fn vec_of_empty(_sets_size: usize, vec_len: usize) -> Vec<Self> {
                     vec![0; vec_len]
                 }
                 fn size(&self) -> usize {
                 }
                 fn capacity(&self) -> usize {
                 }
                 fn add(&mut self, n: usize) {
                     (*self) |= 1 << n;
                 }
                 fn discard(&mut self, n: usize) {
                     (*self) &= u8::MAX - (1 << n);
                 }
                 fn union(&mut self, other: &Self) {
                     if *self != *other {
                         (*self) |= *other;
                     }
                 }
                 fn is_full_range(&self, n: usize) -> bool {
                     *self + 1 == (1 << n)
                 }
                 fn is_empty(&self) -> bool {
                     *self == 0
                 }
                 fn poison(&mut self) {
                     *self = U8_POISON;
                 }
                 fn is_poisoned(&self) -> bool {
                     // equality comparison would be tempting but would not resist
                     // operations after poisoning (even if these should be bogus).
                     *self >= U8_POISON
                 }
             }
             /// A poisonable bit set whose capacity is not known at compile time but
             /// is constant after initial construction
             ///
             /// This can be way further optimized if performance assessments (speed
             /// and/or RAM) require it.
             /// As far as RAM is concerned, for large vectors of these, the main problem
             /// would be the repetition of set_size in each item. We would need a trait
             /// to abstract over the idea of a vector of such bit sets to do better.
             #[derive(Clone, PartialEq)]
             struct NonStaticPoisonableBitSet {
                 set_size: usize,
                 bit_set: Vec<u64>,
             }
             /// Number of `u64` needed for a [`NonStaticPoisonableBitSet`] of given size
             fn non_static_poisonable_inner_len(set_size: usize) -> usize {
 + (set_size + 1) / 64
             }
             impl NonStaticPoisonableBitSet {
                 /// The index of the sub-bit set for the given n, and the index inside
                 /// the latter
                 fn index(&self, n: usize) -> (usize, usize) {
                     (n / 64, n % 64)
                 }
             }
             /// Mock implementation to ensure that the trait makes sense
             impl PoisonableBitSet for NonStaticPoisonableBitSet {
                 fn vec_of_empty(set_size: usize, vec_len: usize) -> Vec<Self> {
                     let tmpl = Self {
                         set_size,
                         bit_set: vec![0u64; non_static_poisonable_inner_len(set_size)],
                     };
                     vec![tmpl; vec_len]
                 }
                 fn size(&self) -> usize {
 + self.bit_set.len() * 8
                 }
                 fn capacity(&self) -> usize {
                     self.set_size
                 }
                 fn add(&mut self, n: usize) {
                     let (sub_bs, bit_pos) = self.index(n);
                     self.bit_set[sub_bs] |= 1 << bit_pos
                 }
                 fn discard(&mut self, n: usize) {
                     let (sub_bs, bit_pos) = self.index(n);
                     self.bit_set[sub_bs] |= u64::MAX - (1 << bit_pos)
                 }
                 fn union(&mut self, other: &Self) {
                     assert!(
                         self.set_size == other.set_size,
                         "Binary operations on bit sets can only be done on same size"
                     );
                     for i in 0..self.bit_set.len() - 1 {
                         self.bit_set[i] |= other.bit_set[i]
                     }
                 }
                 fn is_full_range(&self, n: usize) -> bool {
                     let (sub_bs, bit_pos) = self.index(n);
                     self.bit_set[..sub_bs].iter().all(|bs| *bs == u64::MAX)
                         && self.bit_set[sub_bs] == (1 << (bit_pos + 1)) - 1
                 }
                 fn is_empty(&self) -> bool {
                     self.bit_set.iter().all(|bs| *bs == 0u64)
                 }
                 fn poison(&mut self) {
                     let (sub_bs, bit_pos) = self.index(self.set_size);
                     self.bit_set[sub_bs] = 1 << bit_pos;
                 }
                 fn is_poisoned(&self) -> bool {
                     let (sub_bs, bit_pos) = self.index(self.set_size);
                     self.bit_set[sub_bs] >= 1 << bit_pos
                 }
             }
             /// Set of roots of all non-public phases
             pub type RootsPerPhase = [Vec<Revision>; Phase::non_public_phases().len()];
             #[derive(Debug, Copy, Clone, PartialEq, Eq, Ord, PartialOrd, Hash)]
             pub enum Phase {
                 Public = 0,
                 Draft = 1,
                 Secret = 2,
                 Archived = 3,
                 Internal = 4,
             }
             impl TryFrom<usize> for Phase {
                 type Error = RevlogError;
                 fn try_from(value: usize) -> Result<Self, Self::Error> {
                     Ok(match value {
 => Self::Public,
 => Self::Draft,
 => Self::Secret,
 => Self::Archived,
 => Self::Internal,
                         v => {
                             return Err(RevlogError::corrupted(format!(
                                 "invalid phase value {}",
                                 v
                             )))
                         }
                     })
                 }
             }
             impl Phase {
                 pub const fn all_phases() -> &'static [Self] {
                     &[
                         Self::Public,
                         Self::Draft,
                         Self::Secret,
                         Self::Archived,
                         Self::Internal,
                     ]
                 }
                 pub const fn non_public_phases() -> &'static [Self] {
                     &[Self::Draft, Self::Secret, Self::Archived, Self::Internal]
                 }
             }
             fn inline_scan(bytes: &[u8]) -> (usize, Vec<usize>) {
                 let mut offset: usize = 0;
                 let mut offsets = Vec::new();
                 while offset + INDEX_ENTRY_SIZE <= bytes.len() {
                     offsets.push(offset);
                     let end = offset + INDEX_ENTRY_SIZE;
                     let entry = IndexEntry {
                         bytes: &bytes[offset..end],
                     };
                     offset += INDEX_ENTRY_SIZE + entry.compressed_len() as usize;
                 }
                 (offset, offsets)
             }
             impl super::RevlogIndex for Index {
                 fn len(&self) -> usize {
                     self.len()
                 }
                 fn node(&self, rev: Revision) -> Option<&Node> {
                     if rev == NULL_REVISION {
                         return Some(&NULL_NODE);
                     }
                     self.get_entry(rev).map(|entry| entry.hash())
                 }
             }
             #[derive(Debug)]
             pub struct IndexEntry<'a> {
                 bytes: &'a [u8],
             }
             impl<'a> IndexEntry<'a> {
                 /// Return the offset of the data.
                 pub fn offset(&self) -> usize {
                     let mut bytes = [0; 8];
                     bytes[2..8].copy_from_slice(&self.bytes[0..=5]);
                     BigEndian::read_u64(&bytes[..]) as usize
                 }
                 pub fn raw_offset(&self) -> u64 {
                     BigEndian::read_u64(&self.bytes[0..8])
                 }
                 /// Same result (except potentially for rev 0) as C `index_get_start()`
                 fn c_start(&self) -> u64 {
                     self.raw_offset() >> 16
                 }
                 pub fn flags(&self) -> u16 {
                     BigEndian::read_u16(&self.bytes[6..=7])
                 }
                 /// Return the compressed length of the data.
                 pub fn compressed_len(&self) -> u32 {
                     BigEndian::read_u32(&self.bytes[8..=11])
                 }
                 /// Return the uncompressed length of the data.
                 pub fn uncompressed_len(&self) -> i32 {
                     BigEndian::read_i32(&self.bytes[12..=15])
                 }
                 /// Return the revision upon which the data has been derived.
                 pub fn base_revision_or_base_of_delta_chain(&self) -> UncheckedRevision {
                     // TODO Maybe return an Option when base_revision == rev?
                     //      Requires to add rev to IndexEntry
                     BigEndian::read_i32(&self.bytes[16..]).into()
                 }
                 pub fn link_revision(&self) -> UncheckedRevision {
                     BigEndian::read_i32(&self.bytes[20..]).into()
                 }
                 pub fn p1(&self) -> UncheckedRevision {
                     BigEndian::read_i32(&self.bytes[24..]).into()
                 }
                 pub fn p2(&self) -> UncheckedRevision {
                     BigEndian::read_i32(&self.bytes[28..]).into()
                 }
                 /// Return the hash of revision's full text.
                 ///
                 /// Currently, SHA-1 is used and only the first 20 bytes of this field
                 /// are used.
                 pub fn hash(&self) -> &'a Node {
                     (&self.bytes[32..52]).try_into().unwrap()
                 }
                 pub fn as_bytes(&self) -> &'a [u8] {
                     self.bytes
                 }
             }
             #[cfg(test)]
             pub use tests::IndexEntryBuilder;
             #[cfg(test)]
             mod tests {
                 use super::*;
                 use crate::node::NULL_NODE;
                 #[cfg(test)]
                 #[derive(Debug, Copy, Clone)]
                 pub struct IndexEntryBuilder {
                     is_first: bool,
                     is_inline: bool,
                     is_general_delta: bool,
                     version: u16,
                     offset: usize,
                     compressed_len: usize,
                     uncompressed_len: usize,
                     base_revision_or_base_of_delta_chain: Revision,
                     link_revision: Revision,
                     p1: Revision,
                     p2: Revision,
                     node: Node,
                 }
                 #[cfg(test)]
                 impl IndexEntryBuilder {
                     #[allow(clippy::new_without_default)]
                     pub fn new() -> Self {
                         Self {
                             is_first: false,
                             is_inline: false,
                             is_general_delta: true,
                             version: 1,
                             offset: 0,
                             compressed_len: 0,
                             uncompressed_len: 0,
                             base_revision_or_base_of_delta_chain: Revision(0),
                             link_revision: Revision(0),
                             p1: NULL_REVISION,
                             p2: NULL_REVISION,
                             node: NULL_NODE,
                         }
                     }
                     pub fn is_first(&mut self, value: bool) -> &mut Self {
                         self.is_first = value;
                         self
                     }
                     pub fn with_inline(&mut self, value: bool) -> &mut Self {
                         self.is_inline = value;
                         self
                     }
                     pub fn with_general_delta(&mut self, value: bool) -> &mut Self {
                         self.is_general_delta = value;
                         self
                     }
                     pub fn with_version(&mut self, value: u16) -> &mut Self {
                         self.version = value;
                         self
                     }
                     pub fn with_offset(&mut self, value: usize) -> &mut Self {
                         self.offset = value;
                         self
                     }
                     pub fn with_compressed_len(&mut self, value: usize) -> &mut Self {
                         self.compressed_len = value;
                         self
                     }
                     pub fn with_uncompressed_len(&mut self, value: usize) -> &mut Self {
                         self.uncompressed_len = value;
                         self
                     }
                     pub fn with_base_revision_or_base_of_delta_chain(
                         &mut self,
                         value: Revision,
                     ) -> &mut Self {
                         self.base_revision_or_base_of_delta_chain = value;
                         self
                     }
                     pub fn with_link_revision(&mut self, value: Revision) -> &mut Self {
                         self.link_revision = value;
                         self
                     }
                     pub fn with_p1(&mut self, value: Revision) -> &mut Self {
                         self.p1 = value;
                         self
                     }
                     pub fn with_p2(&mut self, value: Revision) -> &mut Self {
                         self.p2 = value;
                         self
                     }
                     pub fn with_node(&mut self, value: Node) -> &mut Self {
                         self.node = value;
                         self
                     }
                     pub fn build(&self) -> Vec<u8> {
                         let mut bytes = Vec::with_capacity(INDEX_ENTRY_SIZE);
                         if self.is_first {
                             bytes.extend(match (self.is_general_delta, self.is_inline) {
                                 (false, false) => [0u8, 0],
                                 (false, true) => [0u8, 1],
                                 (true, false) => [0u8, 2],
                                 (true, true) => [0u8, 3],
                             });
                             bytes.extend(self.version.to_be_bytes());
                             // Remaining offset bytes.
                             bytes.extend([0u8; 2]);
                         } else {
                             // Offset stored on 48 bits (6 bytes)
                             bytes.extend(&(self.offset as u64).to_be_bytes()[2..]);
                         }
                         bytes.extend([0u8; 2]); // Revision flags.
                         bytes.extend((self.compressed_len as u32).to_be_bytes());
                         bytes.extend((self.uncompressed_len as u32).to_be_bytes());
                         bytes.extend(
                             self.base_revision_or_base_of_delta_chain.0.to_be_bytes(),
                         );
                         bytes.extend(self.link_revision.0.to_be_bytes());
                         bytes.extend(self.p1.0.to_be_bytes());
                         bytes.extend(self.p2.0.to_be_bytes());
                         bytes.extend(self.node.as_bytes());
                         bytes.extend(vec![0u8; 12]);
                         bytes
                     }
                 }
                 pub fn is_inline(index_bytes: &[u8]) -> bool {
                     IndexHeader::parse(index_bytes)
                         .expect("too short")
                         .unwrap()
                         .format_flags()
                         .is_inline()
                 }
                 pub fn uses_generaldelta(index_bytes: &[u8]) -> bool {
                     IndexHeader::parse(index_bytes)
                         .expect("too short")
                         .unwrap()
                         .format_flags()
                         .uses_generaldelta()
                 }
                 pub fn get_version(index_bytes: &[u8]) -> u16 {
                     IndexHeader::parse(index_bytes)
                         .expect("too short")
                         .unwrap()
                         .format_version()
                 }
                 #[test]
                 fn flags_when_no_inline_flag_test() {
                     let bytes = IndexEntryBuilder::new()
                         .is_first(true)
                         .with_general_delta(false)
                         .with_inline(false)
                         .build();
                     assert!(!is_inline(&bytes));
                     assert!(!uses_generaldelta(&bytes));
                 }
                 #[test]
                 fn flags_when_inline_flag_test() {
                     let bytes = IndexEntryBuilder::new()
                         .is_first(true)
                         .with_general_delta(false)
                         .with_inline(true)
                         .build();
                     assert!(is_inline(&bytes));
                     assert!(!uses_generaldelta(&bytes));
                 }
                 #[test]
                 fn flags_when_inline_and_generaldelta_flags_test() {
                     let bytes = IndexEntryBuilder::new()
                         .is_first(true)
                         .with_general_delta(true)
                         .with_inline(true)
                         .build();
                     assert!(is_inline(&bytes));
                     assert!(uses_generaldelta(&bytes));
                 }
                 #[test]
                 fn test_offset() {
                     let bytes = IndexEntryBuilder::new().with_offset(1).build();
                     let entry = IndexEntry { bytes: &bytes };
                     assert_eq!(entry.offset(), 1)
                 }
                 #[test]
                 fn test_compressed_len() {
                     let bytes = IndexEntryBuilder::new().with_compressed_len(1).build();
                     let entry = IndexEntry { bytes: &bytes };
                     assert_eq!(entry.compressed_len(), 1)
                 }
                 #[test]
                 fn test_uncompressed_len() {
                     let bytes = IndexEntryBuilder::new().with_uncompressed_len(1).build();
                     let entry = IndexEntry { bytes: &bytes };
                     assert_eq!(entry.uncompressed_len(), 1)
                 }
                 #[test]
                 fn test_base_revision_or_base_of_delta_chain() {
                     let bytes = IndexEntryBuilder::new()
                         .with_base_revision_or_base_of_delta_chain(Revision(1))
                         .build();
                     let entry = IndexEntry { bytes: &bytes };
                     assert_eq!(entry.base_revision_or_base_of_delta_chain(), 1.into())
                 }
                 #[test]
                 fn link_revision_test() {
                     let bytes = IndexEntryBuilder::new()
                         .with_link_revision(Revision(123))
                         .build();
                     let entry = IndexEntry { bytes: &bytes };
                     assert_eq!(entry.link_revision(), 123.into());
                 }
                 #[test]
                 fn p1_test() {
                     let bytes = IndexEntryBuilder::new().with_p1(Revision(123)).build();
                     let entry = IndexEntry { bytes: &bytes };
                     assert_eq!(entry.p1(), 123.into());
                 }
                 #[test]
                 fn p2_test() {
                     let bytes = IndexEntryBuilder::new().with_p2(Revision(123)).build();
                     let entry = IndexEntry { bytes: &bytes };
                     assert_eq!(entry.p2(), 123.into());
                 }
                 #[test]
                 fn node_test() {
                     let node = Node::from_hex("0123456789012345678901234567890123456789")
                         .unwrap();
                     let bytes = IndexEntryBuilder::new().with_node(node).build();
                     let entry = IndexEntry { bytes: &bytes };
                     assert_eq!(*entry.hash(), node);
                 }
                 #[test]
                 fn version_test() {
                     let bytes = IndexEntryBuilder::new()
                         .is_first(true)
                         .with_version(2)
                         .build();
                     assert_eq!(get_version(&bytes), 2)
                 }
             }