~ubuntu-branches/ubuntu/utopic/libav/utopic-proposed

static void put_vp8_epel ## SIZE ## _h ## HTAPS ## v ## VTAPS ## _c(uint8_t *dst, ptrdiff_t dststride, uint8_t *src, ptrdiff_t srcstride, int h, int mx, int my) \

366

{ \

367

const uint8_t *filter = subpel_filters[mx-1]; \

368

const uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; \

369

int x, y; \

370

uint8_t tmp_array[(2*SIZE+VTAPS-1)*SIZE]; \

371

uint8_t *tmp = tmp_array; \

372

src -= (2-(VTAPS==4))*srcstride; \

373

374

for (y = 0; y < h+VTAPS-1; y++) { \

375

for (x = 0; x < SIZE; x++) \

376

tmp[x] = FILTER_ ## HTAPS ## TAP(src, filter, 1); \

377

tmp += SIZE; \

378

src += srcstride; \

379

} \

380

381

tmp = tmp_array + (2-(VTAPS==4))*SIZE; \

382

filter = subpel_filters[my-1]; \

383

384

for (y = 0; y < h; y++) { \

385

for (x = 0; x < SIZE; x++) \

386

dst[x] = FILTER_ ## VTAPS ## TAP(tmp, filter, SIZE); \

387

dst += dststride; \

388

tmp += SIZE; \

389

} \

487

/*
 * 6-tap filter for the sample at index x.
 *
 * Expands to cm[v], where v is the weighted sum of the six samples
 * src[x - 2 * stride] .. src[x + 3 * stride], rounded with +64 and shifted
 * right by 7.  Taps F[1] and F[4] are subtracted, the other four are added.
 *
 * The expansion refers to `x` and `cm`, which must be in scope at the point
 * of use.  Arguments are parenthesized so that expressions may be passed.
 */
#define FILTER_6TAP(src, F, stride)                                           \
    cm[((F)[2] * (src)[x + 0 * (stride)] - (F)[1] * (src)[x - 1 * (stride)] + \
        (F)[0] * (src)[x - 2 * (stride)] + (F)[3] * (src)[x + 1 * (stride)] - \
        (F)[4] * (src)[x + 2 * (stride)] + (F)[5] * (src)[x + 3 * (stride)] + \
        64) >> 7]

491

492

/*
 * 4-tap filter for the sample at index x.
 *
 * Expands to cm[v], where v is the weighted sum of the four samples
 * src[x - 1 * stride] .. src[x + 2 * stride], rounded with +64 and shifted
 * right by 7.  Only F[1]..F[4] are read; F[1] and F[4] are subtracted,
 * F[2] and F[3] are added.
 *
 * The expansion refers to `x` and `cm`, which must be in scope at the point
 * of use.  Arguments are parenthesized so that expressions may be passed.
 */
#define FILTER_4TAP(src, F, stride)                                           \
    cm[((F)[2] * (src)[x + 0 * (stride)] - (F)[1] * (src)[x - 1 * (stride)] + \
        (F)[3] * (src)[x + 1 * (stride)] - (F)[4] * (src)[x + 2 * (stride)] + \
        64) >> 7]

495

496

/*
 * Define put_vp8_epel<SIZE>_h<TAPS>_c(): horizontal-only filtering.
 *
 * For each of the h rows, every one of the SIZE output pixels is computed
 * with FILTER_<TAPS>TAP along the row (stride 1), using the coefficient row
 * subpel_filters[mx - 1].  dst and src advance by dststride / srcstride
 * after each row.  my is not used.
 *
 * mx - 1 is used directly as an index, so mx is expected to be >= 1
 * (presumably guaranteed by the caller's dispatch -- verify).
 */
#define VP8_EPEL_H(SIZE, TAPS)                                                \
static void put_vp8_epel ## SIZE ## _h ## TAPS ## _c(uint8_t *dst,            \
                                                     ptrdiff_t dststride,     \
                                                     uint8_t *src,            \
                                                     ptrdiff_t srcstride,     \
                                                     int h, int mx, int my)   \
{                                                                             \
    const uint8_t *filter = subpel_filters[mx - 1];                           \
    const uint8_t *cm     = ff_crop_tab + MAX_NEG_CROP;                       \
    int x, y;                                                                 \
                                                                              \
    for (y = 0; y < h; y++) {                                                 \
        for (x = 0; x < SIZE; x++)                                            \
            dst[x] = FILTER_ ## TAPS ## TAP(src, filter, 1);                  \
        dst += dststride;                                                     \
        src += srcstride;                                                     \
    }                                                                         \
}

513

514

/*
 * Define put_vp8_epel<SIZE>_v<TAPS>_c(): vertical-only filtering.
 *
 * For each of the h rows, every one of the SIZE output pixels is computed
 * with FILTER_<TAPS>TAP down the column (stride srcstride), using the
 * coefficient row subpel_filters[my - 1].  Because the filter reads at
 * negative and positive multiples of srcstride, rows above and below the
 * h-row block in src are accessed.  mx is not used.
 *
 * my - 1 is used directly as an index, so my is expected to be >= 1
 * (presumably guaranteed by the caller's dispatch -- verify).
 */
#define VP8_EPEL_V(SIZE, TAPS)                                                \
static void put_vp8_epel ## SIZE ## _v ## TAPS ## _c(uint8_t *dst,            \
                                                     ptrdiff_t dststride,     \
                                                     uint8_t *src,            \
                                                     ptrdiff_t srcstride,     \
                                                     int h, int mx, int my)   \
{                                                                             \
    const uint8_t *filter = subpel_filters[my - 1];                           \
    const uint8_t *cm     = ff_crop_tab + MAX_NEG_CROP;                       \
    int x, y;                                                                 \
                                                                              \
    for (y = 0; y < h; y++) {                                                 \
        for (x = 0; x < SIZE; x++)                                            \
            dst[x] = FILTER_ ## TAPS ## TAP(src, filter, srcstride);          \
        dst += dststride;                                                     \
        src += srcstride;                                                     \
    }                                                                         \
}

531

532

/*
 * Define put_vp8_epel<SIZE>_h<HTAPS>v<VTAPS>_c(): two-pass (horizontal, then
 * vertical) filtering through a temporary buffer.
 *
 * Pass 1 filters h + VTAPS - 1 source rows horizontally with
 * subpel_filters[mx - 1] into tmp_array (SIZE bytes per row), starting
 * 2 rows above src for a 6-tap vertical filter or 1 row above for a 4-tap
 * one.  Pass 2 filters tmp_array vertically (stride SIZE) with
 * subpel_filters[my - 1] into dst.
 *
 * tmp_array holds 2 * SIZE + VTAPS - 1 rows, so h must not exceed 2 * SIZE.
 * mx - 1 and my - 1 are used directly as indices, so both are expected to
 * be >= 1 (presumably guaranteed by the caller's dispatch -- verify).
 */
#define VP8_EPEL_HV(SIZE, HTAPS, VTAPS)                                       \
static void                                                                   \
put_vp8_epel ## SIZE ## _h ## HTAPS ## v ## VTAPS ## _c(uint8_t *dst,         \
                                                        ptrdiff_t dststride,  \
                                                        uint8_t *src,         \
                                                        ptrdiff_t srcstride,  \
                                                        int h, int mx,        \
                                                        int my)               \
{                                                                             \
    const uint8_t *filter = subpel_filters[mx - 1];                           \
    const uint8_t *cm     = ff_crop_tab + MAX_NEG_CROP;                       \
    int x, y;                                                                 \
    uint8_t tmp_array[(2 * SIZE + VTAPS - 1) * SIZE];                         \
    uint8_t *tmp = tmp_array;                                                 \
                                                                              \
    /* back up to the first row the vertical filter will read */              \
    src -= (2 - (VTAPS == 4)) * srcstride;                                    \
                                                                              \
    /* pass 1: horizontal filter into the temporary buffer */                 \
    for (y = 0; y < h + VTAPS - 1; y++) {                                     \
        for (x = 0; x < SIZE; x++)                                            \
            tmp[x] = FILTER_ ## HTAPS ## TAP(src, filter, 1);                 \
        tmp += SIZE;                                                          \
        src += srcstride;                                                     \
    }                                                                         \
                                                                              \
    /* rewind to the temporary row matching the first output row */           \
    tmp    = tmp_array + (2 - (VTAPS == 4)) * SIZE;                           \
    filter = subpel_filters[my - 1];                                          \
                                                                              \
    /* pass 2: vertical filter from the temporary buffer into dst */          \
    for (y = 0; y < h; y++) {                                                 \
        for (x = 0; x < SIZE; x++)                                            \
            dst[x] = FILTER_ ## VTAPS ## TAP(tmp, filter, SIZE);              \
        dst += dststride;                                                     \
        tmp += SIZE;                                                          \
    }                                                                         \
}

391

564

392

565

VP8_EPEL_H(16, 4)

401

574

VP8_EPEL_V(16, 6)

402

575

VP8_EPEL_V(8, 6)

403

576

VP8_EPEL_V(4, 6)

577

404

578

VP8_EPEL_HV(16, 4, 4)

405

579

VP8_EPEL_HV(8, 4, 4)

406

580

VP8_EPEL_HV(4, 4, 4)

414

588

VP8_EPEL_HV(8, 6, 6)

415

589

VP8_EPEL_HV(4, 6, 6)

416

590

417

#define VP8_BILINEAR(SIZE) \

418

static void put_vp8_bilinear ## SIZE ## _h_c(uint8_t *dst, ptrdiff_t dstride, uint8_t *src, ptrdiff_t sstride, int h, int mx, int my) \

419

{ \

420

int a = 8-mx, b = mx; \

421

int x, y; \

422

423

for (y = 0; y < h; y++) { \

424

for (x = 0; x < SIZE; x++) \

425

dst[x] = (a*src[x] + b*src[x+1] + 4) >> 3; \

426

dst += dstride; \

427

src += sstride; \

428

} \

429

} \

430

static void put_vp8_bilinear ## SIZE ## _v_c(uint8_t *dst, ptrdiff_t dstride, uint8_t *src, ptrdiff_t sstride, int h, int mx, int my) \

431

{ \

432

int c = 8-my, d = my; \

433

int x, y; \

434

435

for (y = 0; y < h; y++) { \

436

for (x = 0; x < SIZE; x++) \

437

dst[x] = (c*src[x] + d*src[x+sstride] + 4) >> 3; \

438

dst += dstride; \

439

src += sstride; \

440

} \

441

} \

442

443

static void put_vp8_bilinear ## SIZE ## _hv_c(uint8_t *dst, ptrdiff_t dstride, uint8_t *src, ptrdiff_t sstride, int h, int mx, int my) \

444

{ \

445

int a = 8-mx, b = mx; \

446

int c = 8-my, d = my; \

447

int x, y; \

448

uint8_t tmp_array[(2*SIZE+1)*SIZE]; \

449

uint8_t *tmp = tmp_array; \

450

451

for (y = 0; y < h+1; y++) { \

452

for (x = 0; x < SIZE; x++) \

453

tmp[x] = (a*src[x] + b*src[x+1] + 4) >> 3; \

454

tmp += SIZE; \

455

src += sstride; \

456

} \

457

458

tmp = tmp_array; \

459

460

for (y = 0; y < h; y++) { \

461

for (x = 0; x < SIZE; x++) \

462

dst[x] = (c*tmp[x] + d*tmp[x+SIZE] + 4) >> 3; \

463

dst += dstride; \

464

tmp += SIZE; \

465

} \

591

/*
 * Define the three bilinear interpolation functions for SIZE-pixel-wide
 * blocks: put_vp8_bilinear<SIZE>_h_c, _v_c and _hv_c.
 *
 * All three compute (w0 * p0 + w1 * p1 + 4) >> 3 with weights (8 - m, m):
 *   _h_c  blends src[x] with src[x + 1] using mx (my unused); it reads
 *         SIZE + 1 samples per row.
 *   _v_c  blends src[x] with src[x + sstride] using my (mx unused); it reads
 *         h + 1 rows.
 *   _hv_c runs the horizontal blend over h + 1 rows into a temporary buffer
 *         of SIZE-byte rows, then blends vertically adjacent temporary rows
 *         into dst.  The buffer holds 2 * SIZE + 1 rows, so h must not
 *         exceed 2 * SIZE.
 */
#define VP8_BILINEAR(SIZE)                                                    \
static void put_vp8_bilinear ## SIZE ## _h_c(uint8_t *dst, ptrdiff_t dstride, \
                                             uint8_t *src, ptrdiff_t sstride, \
                                             int h, int mx, int my)           \
{                                                                             \
    int a = 8 - mx, b = mx;                                                   \
    int x, y;                                                                 \
                                                                              \
    for (y = 0; y < h; y++) {                                                 \
        for (x = 0; x < SIZE; x++)                                            \
            dst[x] = (a * src[x] + b * src[x + 1] + 4) >> 3;                  \
        dst += dstride;                                                       \
        src += sstride;                                                       \
    }                                                                         \
}                                                                             \
                                                                              \
static void put_vp8_bilinear ## SIZE ## _v_c(uint8_t *dst, ptrdiff_t dstride, \
                                             uint8_t *src, ptrdiff_t sstride, \
                                             int h, int mx, int my)           \
{                                                                             \
    int c = 8 - my, d = my;                                                   \
    int x, y;                                                                 \
                                                                              \
    for (y = 0; y < h; y++) {                                                 \
        for (x = 0; x < SIZE; x++)                                            \
            dst[x] = (c * src[x] + d * src[x + sstride] + 4) >> 3;            \
        dst += dstride;                                                       \
        src += sstride;                                                       \
    }                                                                         \
}                                                                             \
                                                                              \
static void put_vp8_bilinear ## SIZE ## _hv_c(uint8_t *dst,                   \
                                              ptrdiff_t dstride,              \
                                              uint8_t *src,                   \
                                              ptrdiff_t sstride,              \
                                              int h, int mx, int my)          \
{                                                                             \
    int a = 8 - mx, b = mx;                                                   \
    int c = 8 - my, d = my;                                                   \
    int x, y;                                                                 \
    uint8_t tmp_array[(2 * SIZE + 1) * SIZE];                                 \
    uint8_t *tmp = tmp_array;                                                 \
                                                                              \
    /* pass 1: horizontal blend of h + 1 rows into the temporary buffer */    \
    for (y = 0; y < h + 1; y++) {                                             \
        for (x = 0; x < SIZE; x++)                                            \
            tmp[x] = (a * src[x] + b * src[x + 1] + 4) >> 3;                  \
        tmp += SIZE;                                                          \
        src += sstride;                                                       \
    }                                                                         \
                                                                              \
    /* pass 2: vertical blend of adjacent temporary rows into dst */          \
    tmp = tmp_array;                                                          \
    for (y = 0; y < h; y++) {                                                 \
        for (x = 0; x < SIZE; x++)                                            \
            dst[x] = (c * tmp[x] + d * tmp[x + SIZE] + 4) >> 3;               \
        dst += dstride;                                                       \
        tmp += SIZE;                                                          \
    }                                                                         \
}

VP8_BILINEAR(16)
VP8_BILINEAR(8)
VP8_BILINEAR(4)

471

649

472

#define VP8_MC_FUNC(IDX, SIZE) \

473

dsp->put_vp8_epel_pixels_tab[IDX][0][0] = put_vp8_pixels ## SIZE ## _c; \

474

dsp->put_vp8_epel_pixels_tab[IDX][0][1] = put_vp8_epel ## SIZE ## _h4_c; \

475

dsp->put_vp8_epel_pixels_tab[IDX][0][2] = put_vp8_epel ## SIZE ## _h6_c; \

476

dsp->put_vp8_epel_pixels_tab[IDX][1][0] = put_vp8_epel ## SIZE ## _v4_c; \

650

/*
 * Fill the 3x3 sub-table dsp->put_vp8_epel_pixels_tab[IDX] with the C
 * functions for SIZE-pixel-wide blocks.
 *
 * The second index selects the vertical filter and the third the horizontal
 * filter: 0 = none, 1 = 4-tap, 2 = 6-tap.  Entry [0][0] is the plain
 * put_vp8_pixels<SIZE>_c function.
 *
 * The expansion refers to `dsp`, which must be in scope.  It is wrapped in
 * do { } while (0) so that it behaves as a single statement; the caller
 * supplies the trailing semicolon.
 */
#define VP78_MC_FUNC(IDX, SIZE)                                                 \
    do {                                                                        \
        dsp->put_vp8_epel_pixels_tab[IDX][0][0] = put_vp8_pixels ## SIZE ## _c; \
        dsp->put_vp8_epel_pixels_tab[IDX][0][1] = put_vp8_epel ## SIZE ## _h4_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][0][2] = put_vp8_epel ## SIZE ## _h6_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][1][0] = put_vp8_epel ## SIZE ## _v4_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][1][1] = put_vp8_epel ## SIZE ## _h4v4_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][1][2] = put_vp8_epel ## SIZE ## _h6v4_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][2][0] = put_vp8_epel ## SIZE ## _v6_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][2][1] = put_vp8_epel ## SIZE ## _h4v6_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][2][2] = put_vp8_epel ## SIZE ## _h6v6_c; \
    } while (0)

482

660

483

#define VP8_BILINEAR_MC_FUNC(IDX, SIZE) \

484

dsp->put_vp8_bilinear_pixels_tab[IDX][0][0] = put_vp8_pixels ## SIZE ## _c; \

661

#define VP78_BILINEAR_MC_FUNC(IDX, SIZE) \

662

dsp->put_vp8_bilinear_pixels_tab[IDX][0][0] = put_vp8_pixels ## SIZE ## _c; \

485

663

dsp->put_vp8_bilinear_pixels_tab[IDX][0][1] = put_vp8_bilinear ## SIZE ## _h_c; \

486

664

dsp->put_vp8_bilinear_pixels_tab[IDX][0][2] = put_vp8_bilinear ## SIZE ## _h_c; \

487

665

dsp->put_vp8_bilinear_pixels_tab[IDX][1][0] = put_vp8_bilinear ## SIZE ## _v_c; \

491

669

dsp->put_vp8_bilinear_pixels_tab[IDX][2][1] = put_vp8_bilinear ## SIZE ## _hv_c; \

492

670

dsp->put_vp8_bilinear_pixels_tab[IDX][2][2] = put_vp8_bilinear ## SIZE ## _hv_c

493

671

672

/**
 * Fill the epel and bilinear "put" function tables of a DSP context.
 *
 * Table slots 0, 1 and 2 are set up for 16-, 8- and 4-pixel-wide blocks
 * respectively via VP78_MC_FUNC and VP78_BILINEAR_MC_FUNC.  Afterwards the
 * ARM, PPC and x86 init hooks are called when the corresponding ARCH_*
 * condition is true (presumably so they can replace entries set here --
 * verify against those hooks).
 *
 * @param dsp context whose function tables are written
 */
av_cold void ff_vp78dsp_init(VP8DSPContext *dsp)
{
    VP78_MC_FUNC(0, 16);
    VP78_MC_FUNC(1, 8);
    VP78_MC_FUNC(2, 4);

    VP78_BILINEAR_MC_FUNC(0, 16);
    VP78_BILINEAR_MC_FUNC(1, 8);
    VP78_BILINEAR_MC_FUNC(2, 4);

    if (ARCH_ARM)
        ff_vp78dsp_init_arm(dsp);
    if (ARCH_PPC)
        ff_vp78dsp_init_ppc(dsp);
    if (ARCH_X86)
        ff_vp78dsp_init_x86(dsp);
}

689

690

#if CONFIG_VP7_DECODER
/* Presumably instantiates the vp7_*_loop_filter*_c functions assigned
 * below -- confirm against the LOOP_FILTERS definition. */
LOOP_FILTERS(vp7)

/**
 * Point the transform and loop-filter members of a DSP context at the
 * VP7 C implementations.
 *
 * Only the vp8_luma_dc_wht*, vp8_idct_* and vp8_*_loop_filter* members are
 * written; no arch-specific hook is called from here.
 *
 * @param dsp context whose function pointers are written
 */
av_cold void ff_vp7dsp_init(VP8DSPContext *dsp)
{
    dsp->vp8_luma_dc_wht    = vp7_luma_dc_wht_c;
    dsp->vp8_luma_dc_wht_dc = vp7_luma_dc_wht_dc_c;
    dsp->vp8_idct_add       = vp7_idct_add_c;
    dsp->vp8_idct_dc_add    = vp7_idct_dc_add_c;
    dsp->vp8_idct_dc_add4y  = vp7_idct_dc_add4y_c;
    dsp->vp8_idct_dc_add4uv = vp7_idct_dc_add4uv_c;

    dsp->vp8_v_loop_filter16y = vp7_v_loop_filter16_c;
    dsp->vp8_h_loop_filter16y = vp7_h_loop_filter16_c;
    dsp->vp8_v_loop_filter8uv = vp7_v_loop_filter8uv_c;
    dsp->vp8_h_loop_filter8uv = vp7_h_loop_filter8uv_c;

    dsp->vp8_v_loop_filter16y_inner = vp7_v_loop_filter16_inner_c;
    dsp->vp8_h_loop_filter16y_inner = vp7_h_loop_filter16_inner_c;
    dsp->vp8_v_loop_filter8uv_inner = vp7_v_loop_filter8uv_inner_c;
    dsp->vp8_h_loop_filter8uv_inner = vp7_h_loop_filter8uv_inner_c;

    dsp->vp8_v_loop_filter_simple = vp7_v_loop_filter_simple_c;
    dsp->vp8_h_loop_filter_simple = vp7_h_loop_filter_simple_c;
}
#endif /* CONFIG_VP7_DECODER */

716

717

#if CONFIG_VP8_DECODER

718

LOOP_FILTERS(vp8)

719

494

720

av_cold void ff_vp8dsp_init(VP8DSPContext *dsp)

495

721

{

496

722

dsp->vp8_luma_dc_wht = vp8_luma_dc_wht_c;

513

739

dsp->vp8_v_loop_filter_simple = vp8_v_loop_filter_simple_c;

514

740

dsp->vp8_h_loop_filter_simple = vp8_h_loop_filter_simple_c;

515

741

516

VP8_MC_FUNC(0, 16);

517

VP8_MC_FUNC(1, 8);

518

VP8_MC_FUNC(2, 4);

519

520

VP8_BILINEAR_MC_FUNC(0, 16);

521

VP8_BILINEAR_MC_FUNC(1, 8);

522

VP8_BILINEAR_MC_FUNC(2, 4);

523

524

742

if (ARCH_ARM)

525

743

ff_vp8dsp_init_arm(dsp);

526

if (ARCH_PPC)

527

ff_vp8dsp_init_ppc(dsp);

528

744

if (ARCH_X86)

529

745

ff_vp8dsp_init_x86(dsp);

530

746

}

747

#endif /* CONFIG_VP8_DECODER */

Older »